openGauss-server/src/gausskernel/storage/replication/walsender.cpp

/* -------------------------------------------------------------------------
 *
 * walsender.cpp
 *
 * The WAL sender process (walsender) is new as of Postgres 9.0. It takes
 * care of sending XLOG from the primary server to a single recipient.
 * (Note that there can be more than one walsender process concurrently.)
 * It is started by the postmaster when the walreceiver of a standby server
 * connects to the primary server and requests XLOG streaming replication.
 * It attempts to keep reading XLOG records from the disk and sending them
 * to the standby server, as long as the connection is alive (i.e., like
 * any backend, there is a one-to-one relationship between a connection
 * and a walsender process).
 *
 * Normal termination is by SIGTERM, which instructs the walsender to
 * close the connection and exit(0) at next convenient moment. Emergency
 * termination is by SIGQUIT; like any backend, the walsender will simply
 * abort and exit on SIGQUIT. A close of the connection and a FATAL error
 * are treated as not a crash but approximately normal termination;
 * the walsender will exit quickly without sending any more XLOG records.
 *
 * If the server is shut down, postmaster sends us SIGUSR2 after all
 * regular backends have exited and the shutdown checkpoint has been written.
 * This instructs walsender to send any outstanding WAL, including the
 * shutdown checkpoint record, wait for it to be replicated to the standby,
 * and then exit.
 *
 *
 * Portions Copyright (c) 2020 Huawei Technologies Co.,Ltd.
 * Portions Copyright (c) 2010-2012, PostgreSQL Global Development Group
 *
 * IDENTIFICATION
 *	  src/gausskernel/storage/replication/walsender.cpp
 *
 * -------------------------------------------------------------------------
 */

#define __STDC_FORMAT_MACROS
#include <inttypes.h>
#include <math.h>
#include "postgres.h"
#include "knl/knl_variable.h"

#include <signal.h>
#include <unistd.h>
#ifdef HAVE_NETINET_TCP_H
#include <netinet/tcp.h>
#endif
#include <arpa/inet.h>
#ifndef WIN32
#include <syscall.h>
#endif
#include <sys/stat.h>

#include "access/cbmparsexlog.h"
#include "access/transam.h"
#include "access/xlog_internal.h"
#include "access/xact.h"
#include "access/xlog.h"
#include "access/xlogutils.h"
#include "catalog/pg_authid.h"
#include "catalog/pg_type.h"
#include "cjson/cJSON.h"
#include "commands/dbcommands.h"
#include "funcapi.h"
#include "libpq/libpq.h"
#include "libpq/pqformat.h"
#include "libpq/pqsignal.h"
#include "miscadmin.h"
#include "nodes/replnodes.h"
#include "pgstat.h"
#include "replication/basebackup.h"
#include "replication/catchup.h"
#include "replication/decode.h"
#include "replication/logical.h"
#include "replication/slot.h"
#include "replication/snapbuild.h"
#include "replication/syncrep.h"
#include "replication/walprotocol.h"
#include "replication/walreceiver.h"
#include "replication/walsender.h"
#include "replication/walsender_private.h"
#include "replication/datasender.h"
#include "replication/dataqueue.h"
#include "replication/dcf_flowcontrol.h"
#include "replication/dcf_replication.h"
#include "replication/parallel_decode.h"
#include "replication/parallel_decode_worker.h"
#include "replication/parallel_reorderbuffer.h"
#include "replication/ss_cluster_replication.h"
#include "storage/buf/bufmgr.h"
#include "storage/smgr/fd.h"
#include "storage/ipc.h"
#include "storage/pmsignal.h"
#include "storage/proc.h"
#include "storage/procarray.h"
#include "storage/lmgr.h"
#include "storage/xlog_share_storage/xlog_share_storage.h"
#include "storage/file/fio_device.h"
#include "tcop/tcopprot.h"
#include "utils/acl.h"
#include "utils/builtins.h"
#include "utils/elog.h"
#include "utils/guc.h"
#include "utils/memutils.h"
#include "utils/ps_status.h"
#include "utils/resowner.h"
#include "utils/timestamp.h"
#include "auditfuncs.h"
#include "gssignal/gs_signal.h"
#include "postmaster/postmaster.h"
#include "alarm/alarm.h"
#include "utils/distribute_test.h"
#include "gs_bbox.h"
#include "lz4.h"

/* Sentinel thread id: -1 cast to ThreadId. */
#define InvalidPid ((ThreadId)(-1))

/* NOTE(review): not referenced in the part of the file reviewed here; meaning of 11 to be confirmed at use sites. */
#define CRC_LEN 11

/* Helpers implemented outside this file. */
extern void *internal_load_library(const char *libname);
extern char *expand_dynamic_library_name(const char *name);
extern bool PMstateIsRun(void);

#define NAPTIME_PER_CYCLE 100 /* max sleep time between cycles (100ms) */
/* File-level state flags; all start cleared. They are not read in the part of the file reviewed here. */
bool WalSegmemtRemovedhappened = false;
volatile bool bSyncStat = false;
volatile bool bSyncStatStatBefore = false;
long g_logical_slot_sleep_time = 0;
/* Extra bytes SetReportAppName adds on top of the two name lengths: '[', ']' and the terminating '\0'. */
static int g_appname_extra_len = 3; /* [+]+\0 */


/* Role tests on this walsender's shared-memory slot (t_thrd.walsender_cxt.MyWalSnd->sendRole). */
#define AmWalSenderToDummyStandby() (t_thrd.walsender_cxt.MyWalSnd->sendRole == SNDROLE_PRIMARY_DUMMYSTANDBY)
#define AmWalSenderOnDummyStandby() (t_thrd.walsender_cxt.MyWalSnd->sendRole == SNDROLE_DUMMYSTANDBY_STANDBY)

#define AmWalSenderToStandby() (t_thrd.walsender_cxt.MyWalSnd->sendRole == SNDROLE_PRIMARY_STANDBY)

/*
 * USE_PHYSICAL_XLOG_SEND selects XLogSendPhysical over XLogSendLSN in WalSenderMain.
 * It expands to an expression that reads a variable named `walsnd`, so a WalSnd
 * pointer with exactly that name must be in scope wherever it is used.
 */
#define USE_PHYSICAL_XLOG_SEND \
    (AM_WAL_HADR_SENDER || !SS_REPLICATION_DORADO_CLUSTER || !IS_SHARED_STORAGE_MODE || (walsnd->sendRole == SNDROLE_PRIMARY_BUILDSTANDBY))
#define USE_SYNC_REP_FLUSH_PTR (AM_WAL_HADR_SENDER && (!IS_SHARED_STORAGE_MODE && !SS_REPLICATION_DORADO_CLUSTER))

/* Statistics for log control */
static const int MICROSECONDS_PER_SECONDS = 1000000;
static const int MILLISECONDS_PER_SECONDS = 1000;
/* NOTE(review): the name reads inverted -- 1000 is microseconds per millisecond; confirm against the use sites. */
static const int MILLISECONDS_PER_MICROSECONDS = 1000;
static const int INIT_CONTROL_REPLY = 3;
static const int MAX_CONTROL_REPLY = 1000;
/* NOTE(review): SLEEP_MORE and SLEEP_LESS currently hold the same value (400); confirm that is intended. */
static const int SLEEP_MORE = 400;
static const int SLEEP_LESS = 400;
static const int NODENAMELEN = 1024;
static const int SHIFT_SPEED = 3;
static const int EAGER_MODE_MULTIPLE = 20;
static const int CALCULATE_INTERVAL_MILLISECOND = 2000;
/*
 * True when RTO statistics should be recalculated. Like USE_PHYSICAL_XLOG_SEND
 * this macro captures locals from the expansion site: it needs both `walsnd`
 * and `forceUpdate` to be in scope. The recalculation is due either when
 * sleep_count is a multiple of sleep_count_limit or when forceUpdate is set.
 */
#define NEED_CALCULATE_RTO \
    (((IS_PGXC_DATANODE && t_thrd.postmaster_cxt.HaShmData->current_mode == PRIMARY_MODE) || AM_WAL_HADR_CN_SENDER) \
        && ((walsnd->log_ctrl.sleep_count % walsnd->log_ctrl.sleep_count_limit) == 0 || forceUpdate))

/*
 * State shared between WalSndHandshake and the replication command handler
 * (HandleWalReplicationCommand) while the connection is still in the
 * handshake phase.
 */
typedef struct {
    /* Once true, WalSndHandshake leaves its command loop. */
    bool replicationStarted;
    /* When true after a command, WalSndHandshake sets its idle timeout to 0, which disables the timeout check. */
    bool messageReceiveNoTimeout;
} ReplicationCxt;

/*
 * Forward declarations of file-local helpers. Only a few of them
 * (WalSndHandshake, IdentifySystem, IdentifyVersion) are defined in the part
 * of the file reviewed here; the rest are presumably defined further down.
 */

/* Signal handlers */
static void WalSndSigHupHandler(SIGNAL_ARGS);
static void WalSndShutdownHandler(SIGNAL_ARGS);
static void WalSndQuickDieHandler(SIGNAL_ARGS);
static void WalSndXLogSendHandler(SIGNAL_ARGS);
static void WalSndLastCycleHandler(SIGNAL_ARGS);

static void IdentifyCommand(Node* cmd_node, ReplicationCxt* repCxt, const char *cmd_string);
static void HandleWalReplicationCommand(const char *cmd_string, ReplicationCxt* repCxt);
/*
 * Data-sending callback handed to WalSndLoop. WalSenderMain passes
 * XLogSendLogical, XLogSendPhysical or XLogSendLSN depending on the sender type.
 */
typedef void (*WalSndSendDataCallback)(void);
static int WalSndLoop(WalSndSendDataCallback send_data);
static void InitWalSnd(void);
static void WalSndHandshake(void);
static void WalSndKill(int code, Datum arg);
static void XLogSendPhysical(void);
static void XLogSendLogical(void);
static void IdentifySystem(void);
static void IdentifyVersion(void);
static void IdentifyConsistence(IdentifyConsistenceCmd *cmd);
static void IdentifyChannel(IdentifyChannelCmd *cmd);
static void CreateReplicationSlot(CreateReplicationSlotCmd *cmd);
static void DropReplicationSlot(DropReplicationSlotCmd *cmd);
static void StartReplication(StartReplicationCmd *cmd);
static void StartLogicalReplication(StartReplicationCmd *cmd);
static void AdvanceLogicalReplication(AdvanceReplicationCmd *cmd);
static void ProcessStandbyMessage(void);
static void ProcessStandbyReplyMessage(void);
static void ProcessStandbyHSFeedbackMessage(void);
static void ProcessStandbySwitchRequestMessage(void);
static void ProcessRepliesIfAny(void);
static void ProcessLogCtrl(StandbyReplyMessage reply);
static bool LogicalSlotSleepFlag(void);
static void LogCtrlDoActualSleep(volatile WalSnd *walsnd, bool forceUpdate);
static void LogCtrlExecuteSleeping(volatile WalSnd *walsnd, bool forceUpdate, bool logicalSlotSleepFlag);
static void LogCtrlCountSleepLimit(void);
static void LogCtrlSleep(void);
static void LogCtrlCalculateCurrentRTO(StandbyReplyMessage *reply, bool *needRefresh);
static void LogCtrlCalculateCurrentRPO(StandbyReplyMessage *reply);
#ifdef ENABLE_MULTIPLE_NODES
static void LogCtrlCalculateHadrCurrentRPO(void);
#endif
static void LogCtrlCalculateSleepTime(int64 logCtrlSleepTime, int64 balanceSleepTime, const bool isHadrRPO);
static void WalSndKeepalive(bool requestReply);
static void WalSndRmXLog(bool requestReply);
static void WalSndSyncDummyStandbyDone(bool requestReply);
static void WalSndKeepaliveIfNecessary(TimestampTz now);
static void WalSndResponseSwitchover(char *msgbuf);
static void SetHaWalSenderChannel(void);
static void SetReplWalSender(void);
static bool SendConfigFile(char *path);
static void ProcessStandbyFileTimeMessage(void);

static long WalSndComputeSleeptime(TimestampTz now);
static void WalSndCheckTimeOut(TimestampTz now);
static void WalSndWriteLogicalAdvanceXLog(TimestampTz now);

static void WalSndPrepareWrite(LogicalDecodingContext *ctx, XLogRecPtr lsn, TransactionId xid, bool last_write);
static void WalSndWriteData(LogicalDecodingContext *ctx, XLogRecPtr lsn, TransactionId xid, bool last_write);
static XLogRecPtr WalSndWaitForWal(XLogRecPtr loc);

static void XLogRead(char *buf, XLogRecPtr startptr, Size count);

static void SetWalSndPeerMode(ServerMode mode);
static void SetWalSndPeerDbstate(DbState state);

static void ChooseStartPointForDummyStandby(void);
static bool WalSndCaughtup(void);
static bool WalSndDummyLEStandby(void);
/* Declared noreturn: callers may rely on control never coming back. */
static void WalSndShutdown(void) __attribute__((noreturn));

static bool UpdateHaWalSenderChannel(int ha_remote_listen_port);
static bool IsWalSenderToBuild(void);
static void WalSndSetPercentCountStartLsn(XLogRecPtr startLsn);
static void WalSndRefreshPercentCountStartLsn(XLogRecPtr currentMaxLsn, XLogRecPtr currentDoneLsn);
static void set_xlog_location(ServerMode local_role, XLogRecPtr* sndWrite, XLogRecPtr* sndFlush, XLogRecPtr* sndReplay);
static void ProcessArchiveFeedbackMessage(void);
static void WalSndArchiveXlog(ArchiveXlogMessage *archive_message);
static ArchiveXlogMessage* get_archive_task_from_list();
static void CalCatchupRate();
static void WalSndHadrSwitchoverRequest();
static void ProcessHadrSwitchoverMessage();
static void ProcessHadrReplyMessage();
static int WalSndTimeout();

/*
 * File-level data directory string, initialised to "." (the current directory).
 * NOTE(review): the code reviewed here reads t_thrd.proc_cxt.DataDir instead of
 * this global; confirm who still consumes it.
 */
char *DataDir = ".";

/*
 * Send-data callback used by WalSenderMain when USE_PHYSICAL_XLOG_SEND is
 * false. No WAL bytes are shipped; the peer is only told how far WAL has
 * advanced, through a keepalive ('k') message carrying the current WAL end.
 *
 * The WAL end is taken from the share-storage control info (insertHead) when
 * the local role is PRIMARY_MODE or NORMAL_MODE, and from the standby flush
 * pointer otherwise. sentPtr is updated (thread-local and in the shared WalSnd
 * slot) on every call, but the message itself is throttled: it is skipped
 * when the WAL end did not move, and also when it moved by less than 4MB and
 * fewer than 1000 calls have been skipped since the last send.
 *
 * If the flush to the peer fails the walsender is shut down (WalSndShutdown
 * does not return).
 */
static void XLogSendLSN(void)
{
    PrimaryKeepaliveMessage keepalive_message;
    volatile HaShmemData* hashmdata = t_thrd.postmaster_cxt.HaShmData;
    errno_t errorno = EOK;
    /*
     * Throttle state must be private to each walsender. Walsenders run as
     * threads and several may execute this function concurrently; with plain
     * function-level statics one sender updating lastSendPtr would make every
     * other sender take the "nothing new" early return below and never report
     * that position to its own peer (besides being an unsynchronised data
     * race). Thread-local storage keeps one copy per walsender thread.
     */
    static __thread XLogRecPtr lastSendPtr = 0;
    static __thread uint32 sendCount = 0;
    const uint32 maxWaitCount = 1000;
    const uint32 maxWaitXLoginterval = 1024 * 1024 * 4;

    /* Construct a new message */
    SpinLockAcquire(&hashmdata->mutex);
    keepalive_message.peer_role = hashmdata->current_mode;
    SpinLockRelease(&hashmdata->mutex);
    keepalive_message.peer_state = get_local_dbstate();
    if (PRIMARY_MODE == keepalive_message.peer_role || NORMAL_MODE == keepalive_message.peer_role) {
        /* Local role is primary/normal: the WAL end is the insert head recorded in share storage. */
        ShareStorageXLogCtl *ctlInfo = AlignAllocShareStorageCtl();
        ReadShareStorageCtlInfo(ctlInfo);
        keepalive_message.walEnd = ctlInfo->insertHead;
        AlignFreeShareStorageCtl(ctlInfo);
    } else {
        /* Local role is not a primary */
        keepalive_message.walEnd = GetStandbyFlushRecPtr(NULL);
    }

    t_thrd.walsender_cxt.sentPtr = keepalive_message.walEnd;
    /* Update shared memory status */
    {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
        SpinLockAcquire(&walsnd->mutex);
        walsnd->sentPtr = t_thrd.walsender_cxt.sentPtr;
        SpinLockRelease(&walsnd->mutex);
    }

    /* Throttle: nothing new to report, or too little progress and not yet overdue. */
    if (lastSendPtr == keepalive_message.walEnd) {
        return;
    } else if ((keepalive_message.walEnd < lastSendPtr + maxWaitXLoginterval) && (sendCount < maxWaitCount)) {
        sendCount++;
        return;
    }

    WalSndSetState(WALSNDSTATE_STREAMING);
    sendCount = 0;
    lastSendPtr = keepalive_message.walEnd;
    keepalive_message.sendTime = GetCurrentTimestamp();
    keepalive_message.replyRequested = false;
    /* Evaluated after the state was just set to streaming above. */
    keepalive_message.catchup = (t_thrd.walsender_cxt.MyWalSnd->state == WALSNDSTATE_CATCHUP);
    ereport(DEBUG2, (errmsg("sending wal replication keepalive")));
    t_thrd.walsender_cxt.walSndCaughtUp = true;
    t_thrd.walsender_cxt.catchup_threshold = 0;
    /* Prepend with the message type and send it. */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'k';
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1,
        sizeof(WalDataMessageHeader) + g_instance.attr.attr_storage.MaxSendSize * 1024, &keepalive_message,
        sizeof(PrimaryKeepaliveMessage));
    securec_check(errorno, "\0", "\0");
    (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message, sizeof(PrimaryKeepaliveMessage) + 1);
    /* Flush the keepalive message to standby immediately. */
    if (pq_flush_if_writable() != 0)
        WalSndShutdown();
}


/*
 * Report an application name of the form "<role label>[<session application_name>]"
 * to pgstat for the given sender role.
 *
 * Only the primary-to-dummy-standby, primary-to-build and primary-to-standby
 * roles get a label; for any other role nothing is reported.
 */
void SetReportAppName(SndRole sendRole)
{
    const char* roleLabel = NULL;

    switch (sendRole) {
        case SNDROLE_PRIMARY_DUMMYSTANDBY:
            roleLabel = "WalSender to Secondary";
            break;
        case SNDROLE_PRIMARY_BUILDSTANDBY:
            roleLabel = "WalSender to Build";
            break;
        case SNDROLE_PRIMARY_STANDBY:
            roleLabel = "WalSender to Standby";
            break;
        default:
            /* appname is not required */
            return;
    }

    /* label + session name + room for '[', ']' and the terminating NUL */
    size_t reportLen = strlen(roleLabel) + strlen(u_sess->attr.attr_common.application_name) + g_appname_extra_len;
    char* reportName = (char*)palloc(reportLen);

    int rc = snprintf_s(reportName, reportLen, reportLen - 1,
                        "%s[%s]", roleLabel, u_sess->attr.attr_common.application_name);
    securec_check_ss(rc, "\0", "\0");

    pgstat_report_appname(reportName);
    pfree_ext(reportName);
}

/*
 * Main entry point for walsender process
 *
 * Sets up the per-walsender shared-memory slot, memory contexts and resource
 * owner, announces itself to the postmaster, runs the handshake with the
 * peer (WalSndHandshake) and then enters WalSndLoop with the send callback
 * matching the sender type. The value returned is whatever WalSndLoop returns.
 */
int WalSenderMain(void)
{
    MemoryContext walsnd_context;
    int nRet = 0;

    t_thrd.proc_cxt.MyProgName = "WalSender";
    (void)ShowThreadName("WalSender");
    /* While recovery is in progress this thread takes the standby-sender role. */
    if (RecoveryInProgress()) {
        t_thrd.role = WAL_STANDBY_SENDER;
    }

    /* Skipped for database-connected (logical) senders. */
    if (g_threadPoolControler && !AM_WAL_DB_SENDER) {
        ereport(INFO, (errmsg("Try to bind walsender thread to available CPUs in threadpool.")));
        g_threadPoolControler->BindThreadToAllAvailCpu(t_thrd.proc_cxt.MyProcPid);
    }

    /* Create a per-walsender data structure in shared memory */
    InitWalSnd();

    ereport(LOG, (errmsg("walsender thread started")));
    /*
     * Create a memory context that we will do all our work in.  We do this so
     * that we can reset the context during error recovery and thereby avoid
     * possible memory leaks.  Formerly this code just ran in
     * t_thrd.top_mem_cxt, but resetting that would be a really bad idea.
     *
     * XXX: we don't actually attempt error recovery in walsender, we just
     * close the connection and exit.
     */
    walsnd_context = AllocSetContextCreate(t_thrd.top_mem_cxt, "Wal Sender", ALLOCSET_DEFAULT_MINSIZE,
                                           ALLOCSET_DEFAULT_INITSIZE, ALLOCSET_DEFAULT_MAXSIZE);
    /* Additional per-thread contexts, both children of top_mem_cxt. */
    t_thrd.mem_cxt.msg_mem_cxt = AllocSetContextCreate(t_thrd.top_mem_cxt,
                                                       "MessageContext",
                                                       ALLOCSET_DEFAULT_MINSIZE,
                                                       ALLOCSET_DEFAULT_INITSIZE,
                                                       ALLOCSET_DEFAULT_MAXSIZE);

    t_thrd.mem_cxt.mask_password_mem_cxt = AllocSetContextCreate(t_thrd.top_mem_cxt,
                                                                 "MaskPasswordCtx",
                                                                 ALLOCSET_DEFAULT_MINSIZE,
                                                                 ALLOCSET_DEFAULT_INITSIZE,
                                                                 ALLOCSET_DEFAULT_MAXSIZE);

#if (!defined(ENABLE_MULTIPLE_NODES)) && (!defined(ENABLE_PRIVATEGAUSS))
    /* Only database-connected senders load the SQL plugin. */
    if (AM_WAL_DB_SENDER) {
        LoadSqlPlugin();
    }
#endif

    /* From here on allocations default to the walsender context. */
    (void)MemoryContextSwitchTo(walsnd_context);

    /* Set up resource owner */
    t_thrd.utils_cxt.CurrentResourceOwner = ResourceOwnerCreate(NULL, "walsender top-level resource owner",
        THREAD_GET_MEM_CXT_GROUP(MEMORY_CONTEXT_STORAGE));

    /*
     * Let postmaster know that we're streaming. Once we've declared us as a
     * WAL sender process, postmaster will let us outlive the bgwriter and
     * kill us last in the shutdown sequence, so we get a chance to stream all
     * remaining WAL at shutdown, including the shutdown checkpoint. Note that
     * there's no going back, and we mustn't write any WAL records after this.
     */
    MarkPostmasterChildWalSender();
    SendPostmasterSignal(PMSIGNAL_ADVANCE_STATE_MACHINE);

    /* Unblock signals (they were blocked when the postmaster forked us) */
    gs_signal_setmask(&t_thrd.libpq_cxt.UnBlockSig, NULL);

    /* Replication is refused while SS_IN_REFORM or SS_NORMAL_STANDBY holds. */
    if (SS_IN_REFORM || SS_NORMAL_STANDBY) {
        ereport(ERROR, (errmsg("Can't start replication during reform or on DMS standby mode!")));
    }

    /*
     * Use the recovery target timeline ID during recovery
     */
    if (AM_WAL_STANDBY_SENDER)
        t_thrd.xlog_cxt.ThisTimeLineID = GetRecoveryTargetTLI();

    /* In dummy-standby mode: shut down the WAL receiver first, then adopt the recovery target timeline. */
    if (dummyStandbyMode) {
        ShutdownWalRcv();
        t_thrd.xlog_cxt.ThisTimeLineID = GetRecoveryTargetTLI();
        t_thrd.xlog_cxt.recoveryTargetTLI = GetRecoveryTargetTLI();
        ereport(LOG, (errmsg("ThisTimeLineID: %u", t_thrd.xlog_cxt.ThisTimeLineID)));
    }

    /* Tell the standby that walsender is ready for receiving commands */
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());

    /* Remember the server mode at start-up, if the HA shared data is available. */
    if (t_thrd.postmaster_cxt.HaShmData)
        t_thrd.walsender_cxt.server_run_mode = t_thrd.postmaster_cxt.HaShmData->current_mode;

    SetHaWalSenderChannel();
    Assert(t_thrd.utils_cxt.CurrentResourceOwner != NULL);
    /* Handle handshake messages before streaming */
    WalSndHandshake();

    /* Named `walsnd` on purpose: USE_PHYSICAL_XLOG_SEND below expands to an expression that reads it. */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    /* Initialize shared memory status */
    {
        SpinLockAcquire(&walsnd->mutex);
        walsnd->pid = t_thrd.proc_cxt.MyProcPid;
#ifndef WIN32
        walsnd->lwpId = syscall(SYS_gettid);
#else
        walsnd->lwpId = (int)t_thrd.proc_cxt.MyProcPid;
#endif

        if (AM_WAL_DB_SENDER) {
            /* logical replication */
            walsnd->sentPtr = t_thrd.slot_cxt.MyReplicationSlot->data.restart_lsn;
        } else {
            /* physical replication */
            walsnd->sentPtr = t_thrd.walsender_cxt.sentPtr;
        }

        SpinLockRelease(&walsnd->mutex);

        /* sendRole is read after the lock has been released. */
        SetReportAppName(walsnd->sendRole);
    }

    SyncRepInitConfig();

    /* Build the paths of postgresql.conf and its lock file under the data directory. */
    if (t_thrd.proc_cxt.DataDir) {
        nRet = snprintf_s(t_thrd.walsender_cxt.gucconf_file, MAXPGPATH, MAXPGPATH - 1, "%s/postgresql.conf",
                          t_thrd.proc_cxt.DataDir);
        securec_check_ss(nRet, "\0", "\0");

        nRet = snprintf_s(t_thrd.walsender_cxt.gucconf_lock_file, MAXPGPATH, MAXPGPATH - 1, "%s/postgresql.conf.lock",
                          t_thrd.proc_cxt.DataDir);
        securec_check_ss(nRet, "\0", "\0");
    } else {
        /*
         * NOTE(review): the message prints gucconf_file, which this function
         * has not filled in on this path -- confirm that is the intended value.
         */
        ereport(ERROR, (errcode(ERRCODE_PROTOCOL_VIOLATION),
                        errmsg_internal("cannot find GAUSSDATA: %s", t_thrd.walsender_cxt.gucconf_file)));
    }

    /* init the dummy standby data num to write in wal streaming. */
    if (g_instance.attr.attr_storage.enable_mix_replication && dummyStandbyMode)
        InitWSDataNumOnDummyStandby();

    /* Mix replication without CBM tracking is treated as a fatal misconfiguration (PANIC). */
    if (g_instance.attr.attr_storage.enable_mix_replication && !u_sess->attr.attr_storage.enable_cbm_tracking)
        ereport(PANIC, (errmsg("enable_cbm_tracking must be turn on when enable_mix_replication is on!")));

    /*
     * Main loop of walsender: logical decoding for database-connected senders,
     * otherwise physical WAL shipping, or LSN-only reporting (XLogSendLSN)
     * when USE_PHYSICAL_XLOG_SEND is false.
     */
    if (AM_WAL_DB_SENDER)
        return WalSndLoop(XLogSendLogical);
    else {
        if (USE_PHYSICAL_XLOG_SEND) {
            return WalSndLoop(XLogSendPhysical);
        } else {
            return WalSndLoop(XLogSendLSN);
        }
    }
}

/*
 * Raise ERRCODE_LOGICAL_DECODE_ERROR unless the postmaster state is "run"
 * (PMstateIsRun) and recovery is not in progress.
 */
void CheckPMstateAndRecoveryInProgress(void)
{
    /* Decoding is permitted only when both conditions hold. */
    if (PMstateIsRun() && !RecoveryInProgress()) {
        return;
    }

    ereport(ERROR, (errcode(ERRCODE_LOGICAL_DECODE_ERROR),
                    errmsg("can't decode in pmState is not run or recovery in progress.")));
}

/*
 * Execute commands from walreceiver, until we enter streaming mode.
 */
static void WalSndHandshake(void)
{
    StringInfoData input_message;
    ReplicationCxt repCxt;

    int rc;
    rc = memset_s(&repCxt, sizeof(ReplicationCxt), 0, sizeof(ReplicationCxt));
    securec_check(rc, "\0", "\0");

    int sleeptime = 0;
    int timeout = WalSndTimeout();

    initStringInfo(&input_message);

    while (!repCxt.replicationStarted) {
        int firstchar;
        Assert(t_thrd.utils_cxt.CurrentResourceOwner != NULL);

        WalSndSetState(WALSNDSTATE_STARTUP);
        set_ps_display("idle", false);
        if (t_thrd.walsender_cxt.walsender_ready_to_stop || t_thrd.walsender_cxt.walsender_shutdown_requested) {
            ereport(LOG, (errmsg("caught ready to stop or shutdown request")));
            proc_exit(0);
        }
        /* Wait for some data to arrive */
        if (!pq_select(NAPTIME_PER_CYCLE)) {
            sleeptime += NAPTIME_PER_CYCLE;

            /*
             * not yet data available without blocking,
             * check if it is under maximum timeout
             * period
             */
            if (timeout > 0 && sleeptime >= timeout) {
                ereport(COMMERROR, (errcode(ERRCODE_PROTOCOL_VIOLATION),
                                    errmsg("No message received from standby for maximum time")));
                proc_exit(0);
            }
            continue;
        }

        sleeptime = 0;

        /*
         * Since select has indicated that data is available to read,
         * then we can call blocking function itself, as there must be
         * some data to get.
         */
        firstchar = pq_getbyte();

        /*
         * Emergency bailout if postmaster has died.  This is to avoid the
         * necessity for manual cleanup of all postmaster children.
         */
        if (!PostmasterIsAlive())
            gs_thread_exit(1);

        /*
         * Check for any other interesting events that happened while we
         * slept.
         */
        if (t_thrd.walsender_cxt.got_SIGHUP) {
            t_thrd.walsender_cxt.got_SIGHUP = false;
            ProcessConfigFile(PGC_SIGHUP);
        }

        if (firstchar != EOF) {
            /*
             * Read the message contents. This is expected to be done without
             * blocking because we've been able to get message type code.
             */
            if (pq_getmessage(&input_message, 0))
                firstchar = EOF; /* suitable message already logged */
        }

        /* Handle the very limited subset of commands expected in this phase */
        switch (firstchar) {
            case 'Q': /* Query message */
            {
                const char *query_string = NULL;

                query_string = pq_getmsgstring(&input_message);
                pq_getmsgend(&input_message);

                HandleWalReplicationCommand(query_string, &repCxt);

                if (repCxt.messageReceiveNoTimeout) {
                    timeout = 0;
                }
            } break;

            case 'X':
            case 'c':
                /* standby is closing the connection */
                proc_exit(0);
                /* fall-through */
            case 'P':
                /* standby is closing the connection */
                break;
            case EOF:
                /* standby disconnected unexpectedly */
                ereport(COMMERROR,
                        (errcode(ERRCODE_PROTOCOL_VIOLATION), errmsg("unexpected EOF on standby connection")));
                proc_exit(0);
                /* fall-through */
            default:
                ereport(FATAL, (errcode(ERRCODE_PROTOCOL_VIOLATION),
                                errmsg("invalid standby handshake message type %d", firstchar)));
        }
    }
}

/*
 * IDENTIFY_SYSTEM
 */
static void IdentifySystem(void)
{
    StringInfoData buf;
    char sysid[32];
    char tli[11];
    char xpos[MAXFNAMELEN];
    XLogRecPtr logptr;
    int rc = 0;
    char *dbname = NULL;

    /*
     * Reply with a result set with one row, four columns. First col is system
     * ID, second is timeline ID, third is current xlog location and the fourth
     * contains the database name if we are connected to one.
     */
    rc = snprintf_s(sysid, sizeof(sysid), sizeof(sysid) - 1, UINT64_FORMAT, GetSystemIdentifier());
    securec_check_ss(rc, "\0", "\0");

    rc = snprintf_s(tli, sizeof(tli), sizeof(tli) - 1, "%u", t_thrd.xlog_cxt.ThisTimeLineID);
    securec_check_ss(rc, "\0", "\0");

    logptr = AM_WAL_STANDBY_SENDER ? GetStandbyFlushRecPtr(NULL) : GetFlushRecPtr();

    rc = snprintf_s(xpos, sizeof(xpos), sizeof(xpos) - 1, "%X/%X", (uint32)(logptr >> 32), (uint32)logptr);
    securec_check_ss(rc, "\0", "\0");

    if (u_sess->proc_cxt.MyDatabaseId != InvalidOid) {
        MemoryContext cur = CurrentMemoryContext;

        /* syscache access needs a transaction env. */
        StartTransactionCommand();
        /* make dbname live outside TX context */
        (void)MemoryContextSwitchTo(cur);
        dbname = get_database_name(u_sess->proc_cxt.MyDatabaseId);
        if (dbname == NULL) {
            ereport(ERROR, (errcode(ERRCODE_UNDEFINED_DATABASE),
                            errmsg("database with OID %u does not exist", u_sess->proc_cxt.MyDatabaseId)));
        }
        CommitTransactionCommand();
        /* CommitTransactionCommand switches to t_thrd.top_mem_cxt */
        (void)MemoryContextSwitchTo(cur);
    }

    /* Send a RowDescription message */
    pq_beginmessage(&buf, 'T');
    pq_sendint16(&buf, 4); /* 4 fields */

    /* first field */
    pq_sendstring(&buf, "systemid"); /* col name */
    pq_sendint32(&buf, 0);           /* table oid */
    pq_sendint16(&buf, 0);           /* attnum */
    pq_sendint32(&buf, TEXTOID);     /* type oid */
    pq_sendint16(&buf, UINT16_MAX);  /* typlen */
    pq_sendint32(&buf, 0);           /* typmod */
    pq_sendint16(&buf, 0);           /* format code */

    /* second field */
    pq_sendstring(&buf, "timeline"); /* col name */
    pq_sendint32(&buf, 0);           /* table oid */
    pq_sendint16(&buf, 0);           /* attnum */
    pq_sendint32(&buf, INT4OID);     /* type oid */
    pq_sendint16(&buf, 4);           /* typlen */
    pq_sendint32(&buf, 0);           /* typmod */
    pq_sendint16(&buf, 0);           /* format code */

    /* third field */
    pq_sendstring(&buf, "xlogpos"); /* col name */
    pq_sendint32(&buf, 0);          /* table oid */
    pq_sendint16(&buf, 0);          /* attnum */
    pq_sendint32(&buf, TEXTOID);    /* type oid */
    pq_sendint16(&buf, UINT16_MAX); /* typlen */
    pq_sendint32(&buf, 0);          /* typmod */
    pq_sendint16(&buf, 0);          /* format code */

    /* fourth field */
    pq_sendstring(&buf, "dbname");  /* col name */
    pq_sendint32(&buf, 0);          /* table oid */
    pq_sendint16(&buf, 0);          /* attnum */
    pq_sendint32(&buf, TEXTOID);    /* type oid */
    pq_sendint16(&buf, UINT16_MAX); /* typlen */
    pq_sendint32(&buf, 0);          /* typmod */
    pq_sendint16(&buf, 0);          /* format code */
    pq_endmessage_noblock(&buf);

    /* Send a DataRow message */
    pq_beginmessage(&buf, 'D');
    pq_sendint16(&buf, 4);             /* # of columns */
    pq_sendint32(&buf, strlen(sysid)); /* col1 len */
    pq_sendbytes(&buf, (char *)sysid, strlen(sysid));
    pq_sendint32(&buf, strlen(tli)); /* col2 len */
    pq_sendbytes(&buf, (char *)tli, strlen(tli));
    pq_sendint32(&buf, strlen(xpos)); /* col3 len */
    pq_sendbytes(&buf, (char *)xpos, strlen(xpos));
    /* send NULL if not connected to a database */
    if (dbname != NULL) {
        pq_sendint32(&buf, strlen(dbname)); /* col4 len */
        pq_sendbytes(&buf, (char *)dbname, strlen(dbname));
    } else {
        pq_sendint32(&buf, UINT32_MAX); /* col4 len, NULL */
    }
    pq_endmessage_noblock(&buf);

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us */
}

/*
 * IDENTIFY_VERSION
 */
static void IdentifyVersion(void)
{
    StringInfoData buf;
    char pg_sversion[11] = {0};
    char pg_pversion[32] = {0};
    char term[11] = {0};
    uint32 sys_version = PG_VERSION_NUM;
    int nRet = 0;
    errno_t rc = EOK;

    nRet = snprintf_s(pg_sversion, sizeof(pg_sversion), sizeof(pg_sversion) - 1, "%u", sys_version);
    securec_check_ss(nRet, "\0", "\0");

    rc = strncpy_s(pg_pversion, sizeof(pg_pversion), PG_PROTOCOL_VERSION, strlen(PG_PROTOCOL_VERSION));
    securec_check(rc, "\0", "\0");
    uint32 term_cur = Max(g_instance.comm_cxt.localinfo_cxt.term_from_file,
                          g_instance.comm_cxt.localinfo_cxt.term_from_xlog);
    nRet = snprintf_s(term, sizeof(term), sizeof(term) - 1, "%u", term_cur);
    securec_check_ss(nRet, "\0", "\0");
    pg_pversion[strlen(PG_PROTOCOL_VERSION)] = '\0';

    /* Send a RowDescription message */
    pq_beginmessage(&buf, 'T');
    pq_sendint16(&buf, 3); /* 3 fields */

    /* first field */
    pq_sendstring(&buf, "sversion"); /* col name */
    pq_sendint32(&buf, 0);           /* table oid */
    pq_sendint16(&buf, 0);           /* attnum */
    pq_sendint32(&buf, INT4OID);     /* type oid */
    pq_sendint16(&buf, 4);           /* typlen */
    pq_sendint32(&buf, 0);           /* typmod */
    pq_sendint16(&buf, 0);           /* format code */

    /* second field */
    pq_sendstring(&buf, "pversion"); /* col name */
    pq_sendint32(&buf, 0);           /* table oid */
    pq_sendint16(&buf, 0);           /* attnum */
    pq_sendint32(&buf, TEXTOID);     /* type oid */
    pq_sendint16(&buf, UINT16_MAX);  /* typlen */
    pq_sendint32(&buf, 0);           /* typmod */
    pq_sendint16(&buf, 0);           /* format code */

    /* first field */
    pq_sendstring(&buf, "term"); /* col name */
    pq_sendint32(&buf, 0);       /* table oid */
    pq_sendint16(&buf, 0);       /* attnum */
    pq_sendint32(&buf, INT4OID); /* type oid */
    pq_sendint16(&buf, 4);       /* typlen */
    pq_sendint32(&buf, 0);       /* typmod */
    pq_sendint16(&buf, 0);       /* format code */
    pq_endmessage_noblock(&buf);

    /* Send a DataRow message */
    pq_beginmessage(&buf, 'D');
    pq_sendint16(&buf, 3);                   /* # of columns */
    pq_sendint32(&buf, strlen(pg_sversion)); /* col1 len */
    pq_sendbytes(&buf, (char *)pg_sversion, strlen(pg_sversion));
    pq_sendint32(&buf, strlen(pg_pversion)); /* col2 len */
    pq_sendbytes(&buf, (char *)pg_pversion, strlen(pg_pversion));
    pq_sendint32(&buf, strlen(term)); /* col2 len */
    pq_sendbytes(&buf, (char *)term, strlen(term));
    pq_endmessage_noblock(&buf);

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us */
}

/*
 * IDENTIFY_MODE
 *
 * Answers the command with a one-row, one-column result ("smode") whose value
 * is the numeric ServerMode of this node rendered as decimal text.
 * The function is non-static; the original note says it is exported for the
 * data sender.
 */
void IdentifyMode(void)
{
    StringInfoData buf;
    char smode[11];
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    int nRet = 0;
    ServerMode current_mode = UNKNOWN_MODE;

    /* Derive the mode to report from the HA shared state, under its spinlock. */
    SpinLockAcquire(&hashmdata->mutex);
    if (hashmdata->current_mode == STANDBY_MODE && hashmdata->is_cascade_standby) {
        current_mode = CASCADE_STANDBY_MODE;
    } else if (IS_SHARED_STORAGE_MODE && (hashmdata->current_mode == STANDBY_MODE)) {
        /*
         * A shared-storage standby only reports a real mode while its WAL
         * receiver is online and the current replication channel has no
         * rebuild reason other than NONE_REBUILD/CONNECT_REBUILD; otherwise
         * current_mode keeps its initial UNKNOWN_MODE value.
         */
        if (WalRcvIsOnline() && (hashmdata->repl_reason[hashmdata->current_repl] == NONE_REBUILD ||
            hashmdata->repl_reason[hashmdata->current_repl] == CONNECT_REBUILD)) {
            current_mode = hashmdata->is_hadr_main_standby ? MAIN_STANDBY_MODE : hashmdata->current_mode;
        }
#ifdef ENABLE_MULTIPLE_NODES
    } else if (IS_PGXC_COORDINATOR && hashmdata->current_mode == NORMAL_MODE && RecoveryInProgress()) {
        current_mode = RECOVERY_MODE;
#endif
    } else {
        current_mode = hashmdata->current_mode;
    }
    SpinLockRelease(&hashmdata->mutex);

    /*
     * Format the reply only after the spinlock has been released: the text is
     * built from the local copy, and securec_check_ss may raise an error,
     * which must not happen while a spinlock is held.
     */
    nRet = snprintf_s(smode, sizeof(smode), sizeof(smode) - 1, "%d", current_mode);
    securec_check_ss(nRet, "\0", "\0");

    /* Send a RowDescription message */
    pq_beginmessage(&buf, 'T');
    pq_sendint16(&buf, 1); /* 1 field */

    /* first field */
    pq_sendstring(&buf, "smode"); /* col name */
    pq_sendint32(&buf, 0);        /* table oid */
    pq_sendint16(&buf, 0);        /* attnum */
    pq_sendint32(&buf, INT4OID);  /* type oid */
    pq_sendint16(&buf, 4);        /* typlen */
    pq_sendint32(&buf, 0);        /* typmod */
    pq_sendint16(&buf, 0);        /* format code */
    pq_endmessage_noblock(&buf);

    /* Send a DataRow message */
    pq_beginmessage(&buf, 'D');
    pq_sendint16(&buf, 1);             /* # of columns */
    pq_sendint32(&buf, strlen(smode)); /* col1 len */
    pq_sendbytes(&buf, (char *)smode, strlen(smode));
    pq_endmessage_noblock(&buf);

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us */
}

#ifndef ENABLE_MULTIPLE_NODES
/*
 * IDENTIFY_AZ
 */
void IdentifyAvailableZone(void)
{
    StringInfoData buf;

    /* Send a RowDescription message */
    pq_beginmessage(&buf, 'T');
    pq_sendint16(&buf, 1); /* 1 fields */

    /* first field */
    pq_sendstring(&buf, "azname"); /* col name */
    pq_sendint32(&buf, 0);          /* table oid */
    pq_sendint16(&buf, 0);          /* attnum */
    pq_sendint32(&buf, TEXTOID);    /* type oid */
    pq_sendint16(&buf, UINT16_MAX); /* typlen */
    pq_sendint32(&buf, 0);          /* typmod */
    pq_sendint16(&buf, 0);          /* format code */
    pq_endmessage_noblock(&buf);

    /* Send a DataRow message */
    pq_beginmessage(&buf, 'D');
    pq_sendint16(&buf, 1);             /* # of columns */
    char* azname = g_instance.attr.attr_storage.available_zone;
    pq_sendint32(&buf, strlen(azname)); /* col1 len */
    pq_sendbytes(&buf, (char*)azname, strlen(azname));
    pq_endmessage_noblock(&buf);

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us */
}
#endif

/*
 * IDENTIFY_MAXLSN
 * This LSN contains two part,node name and XLogRecPtr
 * One case is CN build DN and get current latest flushed LSN here
 */
static void IdentifyMaxLsn(void)
{
    int nRet = 0;
    StringInfoData buf;
    char str[MAXFNAMELEN];
    char recptr[MAXFNAMELEN];

    XLogRecPtr ptr = GetFlushRecPtr();

    nRet = snprintf_s(recptr, sizeof(recptr), sizeof(recptr) - 1, "%X/%X", (uint32)(ptr >> 32), (uint32)ptr);
    securec_check_ss(nRet, "\0", "\0");
    nRet = snprintf_s(str, sizeof(str), sizeof(str) - 1, "%s|%s", g_instance.attr.attr_common.PGXCNodeName, recptr);
    securec_check_ss(nRet, "\0", "\0");

    pq_beginmessage(&buf, 'T'); /* RowDescription */
    pq_sendint16(&buf, 1);      /* 1 field */

    /* Field header */
    pq_sendstring(&buf, "recptr");
    pq_sendint32(&buf, 0);       /* table oid */
    pq_sendint16(&buf, 0);       /* attnum */
    pq_sendint32(&buf, TEXTOID); /* type oid */
    pq_sendint16(&buf, UINT16_MAX);
    pq_sendint32(&buf, 0);
    pq_sendint16(&buf, 0);
    pq_endmessage_noblock(&buf);

    /* Data row */
    pq_beginmessage(&buf, 'D');
    pq_sendint16(&buf, 1);           /* number of columns */
    pq_sendint32(&buf, strlen(str)); /* length */
    pq_sendbytes(&buf, str, strlen(str));
    pq_endmessage_noblock(&buf);

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us */
}

/*
 * IDENTIFY_CONSISTENCE
 * identify consistence of primary and standby
 *
 * Looks up the CRC for the record position supplied in cmd->recordptr and
 * sends it back as a one-row result.  Two reply layouts exist, selected by
 * the working version number of this backend:
 *   - workingVersionNum >= 92060: three text columns
 *     (requestRemoteCrc, localMaxLsn, localMaxLsnCrc);
 *   - otherwise: two columns (reccrc, havexlog).
 * The reply is followed by CommandComplete and ReadyForQuery.
 */
static void IdentifyConsistence(IdentifyConsistenceCmd *cmd)
{
    StringInfoData buf;
    char crc[CRC_LEN] = {0};
    char maxLsnCrcStr[CRC_LEN] = {0};
    pg_crc32 requestRecCrc = 0;
    pg_crc32 localMaxLsnCrc = 0;
    bool crcValid = false;
    XLogRecPtr localMaxPtr = InvalidXLogRecPtr;
    ;
    char strMaxPtr[MAXFNAMELEN] = {0};
    int nRet = 0;
    char msgBuf[XLOG_READER_MAX_MSGLENTH] = {0};

    /* NOTE(review): crcValid is presumably filled in by the callee (passed by reference) -- confirm */
    requestRecCrc = GetXlogRecordCrc(cmd->recordptr, crcValid, XLogPageRead, 0);

    /* To support gray upgrade, a message with 1 row of 2 or 3 columns is used
     * according to the working version number. Will remove later.
     */
    if (t_thrd.proc && t_thrd.proc->workingVersionNum >= 92060) {
        /* Don't care max xlog when check with building process */
        if (IsWalSenderToBuild() == false) {
            if (dummyStandbyMode) {
                localMaxPtr = FindMaxLSN(t_thrd.proc_cxt.DataDir, msgBuf, XLOG_READER_MAX_MSGLENTH, &localMaxLsnCrc);
            } else {
                if (AM_WAL_STANDBY_SENDER) {
                    /* a standby sender uses its replay position as the local max LSN */
                    (void)GetXLogReplayRecPtr(NULL, &localMaxPtr);
                    localMaxLsnCrc = GetXlogRecordCrc(localMaxPtr, crcValid, XLogPageRead, 0);
                } else {
                    localMaxPtr = FindMaxLSN(t_thrd.proc_cxt.DataDir, msgBuf, XLOG_READER_MAX_MSGLENTH,
                                             &localMaxLsnCrc);
                }
            }

            ereport(LOG, (errmsg("remote request lsn/crc: [%X/%X, %u] "
                                 "local max lsn/crc: [%X/%X, %u]",
                                 (uint32)(cmd->recordptr >> 32), (uint32)cmd->recordptr, (uint32)requestRecCrc,
                                 (uint32)(localMaxPtr >> 32), (uint32)localMaxPtr, (uint32)localMaxLsnCrc)));
        }

        /* no CRC found for the requested record but the sender is caught up: report IGNORE_REC_CRC instead */
        if (requestRecCrc == NONE_REC_CRC && WalSndCaughtup()) {
            requestRecCrc = IGNORE_REC_CRC;
        }

        /* render the three column values as text */
        nRet = snprintf_s(crc, sizeof(crc), sizeof(crc) - 1, "%X", requestRecCrc);
        securec_check_ss(nRet, "\0", "\0");

        nRet = snprintf_s(strMaxPtr, sizeof(strMaxPtr), sizeof(strMaxPtr) - 1, "%X/%X", (uint32)(localMaxPtr >> 32),
                          (uint32)localMaxPtr);
        securec_check_ss(nRet, "\0", "\0");

        nRet = snprintf_s(maxLsnCrcStr, sizeof(maxLsnCrcStr), sizeof(maxLsnCrcStr) - 1, "%X", localMaxLsnCrc);
        securec_check_ss(nRet, "\0", "\0");

        /* Send a RowDescription message */
        pq_beginmessage(&buf, 'T');
        pq_sendint16(&buf, 3); /* 3 fields */

        /* first field */
        pq_sendstring(&buf, "requestRemoteCrc"); /* col name */
        pq_sendint32(&buf, 0);                   /* table oid */
        pq_sendint16(&buf, 0);                   /* attnum */
        pq_sendint32(&buf, TEXTOID);             /* type oid */
        pq_sendint16(&buf, UINT16_MAX);          /* typlen */
        pq_sendint32(&buf, 0);                   /* typmod */
        pq_sendint16(&buf, 0);                   /* format code */

        /* second field */
        pq_sendstring(&buf, "localMaxLsn"); /* col name */
        pq_sendint32(&buf, 0);              /* table oid */
        pq_sendint16(&buf, 1);              /* attnum */
        pq_sendint32(&buf, TEXTOID);        /* type oid */
        pq_sendint16(&buf, UINT16_MAX);     /* typlen */
        pq_sendint32(&buf, 0);              /* typmod */
        pq_sendint16(&buf, 0);              /* format code */

        /* third field */
        pq_sendstring(&buf, "localMaxLsnCrc"); /* col name */
        pq_sendint32(&buf, 0);                 /* table oid */
        pq_sendint16(&buf, 2);                 /* attnum */
        pq_sendint32(&buf, TEXTOID);           /* type oid */
        pq_sendint16(&buf, UINT16_MAX);        /* typlen */
        pq_sendint32(&buf, 0);                 /* typmod */
        pq_sendint16(&buf, 0);                 /* format code */

        pq_endmessage_noblock(&buf);

        /* Send a DataRow message */
        pq_beginmessage(&buf, 'D');
        pq_sendint16(&buf, 3);           /* # of columns */
        pq_sendint32(&buf, strlen(crc)); /* col1 len */
        pq_sendbytes(&buf, (char *)crc, strlen(crc));
        pq_sendint32(&buf, strlen(strMaxPtr)); /* col2 len */
        pq_sendbytes(&buf, (char *)strMaxPtr, strlen(strMaxPtr));
        pq_sendint32(&buf, strlen(maxLsnCrcStr)); /* col3 len */
        pq_sendbytes(&buf, (char *)maxLsnCrcStr, strlen(maxLsnCrcStr));
        pq_endmessage_noblock(&buf);
    } else {
        /* older peers: two-column reply; havexlog is the text "1" or "0" */
        char havexlog[8] = {0};
        if (dummyStandbyMode) {
            if (crcValid) {
                havexlog[0] = '1';
            } else {
                /* no valid CRC: answer "0" if the local max LSN is invalid or behind the requested position */
                localMaxPtr = FindMaxLSN(t_thrd.proc_cxt.DataDir, msgBuf, XLOG_READER_MAX_MSGLENTH, &localMaxLsnCrc);
                if (XLByteLT(localMaxPtr, cmd->recordptr) || XLByteEQ(localMaxPtr, InvalidXLogRecPtr)) {
                    havexlog[0] = '0';
                } else {
                    havexlog[0] = '1';
                }
            }
            ereport(LOG, (errmsg("standby rec: %x/%x, havexlog: %s, crc:%u", (uint32)(cmd->recordptr >> 32),
                                 (uint32)cmd->recordptr, havexlog, (uint32)requestRecCrc)));
        } else {
            havexlog[0] = '1'; /* have xlog be true if in primary mode */
        }

        nRet = snprintf_s(crc, sizeof(crc), sizeof(crc) - 1, "%X", requestRecCrc);
        securec_check_ss(nRet, "\0", "\0");

        /* Send a RowDescription message */
        pq_beginmessage(&buf, 'T');
        pq_sendint16(&buf, 2); /* 2 fields */

        /* first field */
        pq_sendstring(&buf, "reccrc");  /* col name */
        pq_sendint32(&buf, 0);          /* table oid */
        pq_sendint16(&buf, 0);          /* attnum */
        pq_sendint32(&buf, TEXTOID);    /* type oid */
        pq_sendint16(&buf, UINT16_MAX); /* typlen */
        pq_sendint32(&buf, 0);          /* typmod */
        pq_sendint16(&buf, 0);          /* format code */

        /* second field */
        pq_sendstring(&buf, "havexlog"); /* col name */
        pq_sendint32(&buf, 0);           /* table oid */
        pq_sendint16(&buf, 0);           /* attnum */
        pq_sendint32(&buf, INT4OID);     /* type oid */
        pq_sendint16(&buf, 4);           /* typlen */
        pq_sendint32(&buf, 0);           /* typmod */
        pq_sendint16(&buf, 0);           /* format code */
        pq_endmessage_noblock(&buf);

        /* Send a DataRow message */
        pq_beginmessage(&buf, 'D');
        pq_sendint16(&buf, 2);           /* # of columns */
        pq_sendint32(&buf, strlen(crc)); /* col1 len */
        pq_sendbytes(&buf, (char *)crc, strlen(crc));
        pq_sendint32(&buf, strlen(havexlog)); /* col2 len */
        pq_sendbytes(&buf, (char *)havexlog, strlen(havexlog));
        pq_endmessage_noblock(&buf);
    }

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us */
}

/*
 * IDENTIFY_CHANNEL
 *
 * Records the channel identifier sent by the standby as this walsender's
 * remote port, asks UpdateHaWalSenderChannel() to register it, and reports
 * the outcome as a single boolean column ("identifier") holding "t" or "f".
 */
static void IdentifyChannel(IdentifyChannelCmd *cmd)
{
    StringInfoData msg;

    t_thrd.walsender_cxt.remotePort = cmd->channel_identifier;
    const bool updated = UpdateHaWalSenderChannel(t_thrd.walsender_cxt.remotePort);

    /* textual boolean as it goes on the wire */
    const char *answer = "f";
    if (updated) {
        answer = "t";
    }
    const size_t answerLen = strlen(answer);

    /* RowDescription: one boolean column */
    pq_beginmessage(&msg, 'T');
    pq_sendint16(&msg, 1);

    pq_sendstring(&msg, "identifier"); /* col name */
    pq_sendint32(&msg, 0);             /* table oid */
    pq_sendint16(&msg, 0);             /* attnum */
    pq_sendint32(&msg, BOOLOID);       /* type oid */
    pq_sendint16(&msg, 1);             /* typlen */
    pq_sendint32(&msg, 0);             /* typmod */
    pq_sendint16(&msg, 0);             /* format code */
    pq_endmessage_noblock(&msg);

    /* DataRow with the result flag */
    pq_beginmessage(&msg, 'D');
    pq_sendint16(&msg, 1);         /* # of columns */
    pq_sendint32(&msg, answerLen); /* col1 len */
    pq_sendbytes(&msg, answer, answerLen);
    pq_endmessage_noblock(&msg);

    /* CommandComplete followed by ReadyForQuery */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
}

/*
 * START_REPLICATION
 *
 * Prepares this walsender for physical streaming: optionally acquires the
 * requested slot, switches to the CATCHUP state, sends CopyBothResponse and
 * sets the position from which WAL will be shipped.
 */
static void StartReplication(StartReplicationCmd *cmd)
{
    StringInfoData copyBothMsg;

    /*
     * Promotion of a cascading standby makes postmaster send SIGUSR2 to the
     * cascading walsenders so that they terminate.  Only processes already
     * marked as WAL senders get that signal, so a walsender that has not yet
     * marked itself can miss it and outlive the promotion.
     *
     * Close that window here: a cascading walsender that finds recovery is
     * no longer in progress behaves as the SIGUSR2 handler would and sets
     * t_thrd.walsender_cxt.walsender_ready_to_stop, so it ends later.
     *
     * Postmaster normally logs the termination of cascading walsenders, but
     * it skips that message when it believes no walsender exists, which can
     * happen if this is the only one and it had not registered yet.  The
     * message is therefore always emitted here; an occasional duplicate is
     * considered acceptable.
     */
    const bool cascadingAfterPromotion = AM_WAL_STANDBY_SENDER && !RecoveryInProgress();
    if (cascadingAfterPromotion) {
        ereport(LOG, (errmsg("terminating walsender process to force cascaded standby "
                             "to update timeline and reconnect")));
        t_thrd.walsender_cxt.walsender_ready_to_stop = true;
    }

    /*
     * The WAL is assumed to contain enough information for log shipping;
     * that is checked in PostmasterMain().
     *
     * NOTE: wal_level can only change at shutdown, so it is unlikely that
     * WAL written at wal_level='minimal' is still visible here.
     */
    if (cmd->slotname) {
        const bool forDummyStandby = AmWalSenderToDummyStandby();

        ReplicationSlotAcquire(cmd->slotname, forDummyStandby);

        /* a slot bound to a database is a logical slot and cannot be used here */
        if (t_thrd.slot_cxt.MyReplicationSlot->data.database != InvalidOid) {
            ereport(ERROR, (errcode(ERRCODE_OBJECT_NOT_IN_PREREQUISITE_STATE),
                            errmsg("cannot use a logical replication slot for physical replication")));
        }
    }

    /*
     * A freshly connected standby is behind the primary.  Expose this initial
     * catchup phase as its own state so that it can be monitored (it may last
     * a long time) and so that later state changes, e.g. for synchronous
     * replication, can trigger actions.
     */
    WalSndSetState(WALSNDSTATE_CATCHUP);

    /* CopyBothResponse: overall format 0, zero columns; then flush with timeout */
    pq_beginmessage(&copyBothMsg, 'W');
    pq_sendbyte(&copyBothMsg, 0);
    pq_sendint16(&copyBothMsg, 0);
    pq_endmessage_noblock(&copyBothMsg);
    pq_flush_timedwait(WalSndTimeout());

    /*
     * Decide where shipping starts: a dummy standby gets its start point
     * chosen separately, everyone else starts at the requested position.
     */
    if (!AmWalSenderToDummyStandby()) {
        t_thrd.walsender_cxt.sentPtr = cmd->startpoint;
        WalSndSetPercentCountStartLsn(cmd->startpoint);
    } else {
        ChooseStartPointForDummyStandby();
    }
}

/*
 * read_page callback used by logical decoding contexts running inside a
 * walsender.
 *
 * Unlike logical_read_local_xlog_page, which has to sleep/busy-loop, this
 * variant can wait efficiently because the walsender's latch is set whenever
 * WAL is flushed.
 *
 * Returns the number of valid bytes in cur_page (a full XLOG_BLCKSZ or the
 * flushed part of the page), or -1 when the required WAL did not become
 * available, which implies a shutdown is under way.
 */
int logical_read_xlog_page(XLogReaderState *state, XLogRecPtr targetPagePtr, int reqLen, XLogRecPtr targetRecPtr,
    char *cur_page, TimeLineID *pageTLI, char* xlog_path)
{
    /* wait until WAL has been flushed at least up to the requested bytes */
    const XLogRecPtr flushedUpTo = WalSndWaitForWal(targetPagePtr + reqLen);

    if (flushedUpTo < targetPagePtr + reqLen) {
        return -1;
    }

    /* whole block flushed, or only its leading part */
    const bool wholePageFlushed = (targetPagePtr + XLOG_BLCKSZ <= flushedUpTo);
    int validBytes = wholePageFlushed ? XLOG_BLCKSZ : (int)(flushedUpTo - targetPagePtr);

    /* the data is known to be there; a full block is always read */
    XLogRead(cur_page, targetPagePtr, XLOG_BLCKSZ);

    return validBytes;
}

/*
 * Create a new replication slot.
 *
 * Logical slots are first created as ephemeral, an initial decoding context
 * is built to find the consistent start point, and only then is the slot
 * persisted and the creation WAL-logged.  Physical slots are created
 * persistent right away with the caller-supplied initial LSN.
 *
 * The reply is a single row with four text columns (slot_name,
 * consistent_point, snapshot_name, output_plugin), plus a fifth column
 * (snapshot_csn) when cmd->useSnapshot is set.  The slot is released again
 * before returning; START_REPLICATION re-acquires it.
 */
static void CreateReplicationSlot(CreateReplicationSlotCmd *cmd)
{
#define MAX_ULONG_LENGTH 22
    const char *slot_name = NULL;
    StringInfoData buf;
    bool isDummyStandby = false;
    const char *snapshot_name = NULL;
    Snapshot snap;
    char xpos[MAXFNAMELEN];
    /*
     * Zero-initialized: the buffer is only filled on the logical/useSnapshot
     * path below but is read whenever cmd->useSnapshot is set, so it must be
     * a valid (empty) string on every other path.
     */
    char strCSN[MAX_ULONG_LENGTH] = {0};
    int rc = 0;

    Assert(!t_thrd.slot_cxt.MyReplicationSlot);

    /* setup state for XLogReadPage */
    isDummyStandby = AmWalSenderToDummyStandby() ? true : false;

    if (cmd->kind == REPLICATION_KIND_LOGICAL) {
        MarkPostmasterChildNormal();
        CheckPMstateAndRecoveryInProgress();
        CheckLogicalDecodingRequirements(u_sess->proc_cxt.MyDatabaseId);
        /*
         * Initially create the slot as ephemeral - that allows us to nicely
         * handle errors during initialization because it'll get dropped if
         * this transaction fails. We'll make it persistent at the end.
         */
        ReplicationSlotCreate(cmd->slotname, RS_EPHEMERAL, isDummyStandby, u_sess->proc_cxt.MyDatabaseId,
                              InvalidXLogRecPtr);
    } else {
        /*
         * physical slot save init value if exist
         */
        ReplicationSlotCreate(cmd->slotname, RS_PERSISTENT, isDummyStandby, InvalidOid, cmd->init_slot_lsn);
    }
    slot_name = NameStr(t_thrd.slot_cxt.MyReplicationSlot->data.name);

    if (cmd->kind == REPLICATION_KIND_LOGICAL) {
        ValidateInputString(cmd->slotname);
        ValidateInputString(cmd->plugin);
        char *fullname = NULL;

        /*
         * Do options check early so that we can bail before calling the
         * DecodingContextFindStartpoint which can take long time.
         */
        if (cmd->useSnapshot) {
            if (!IsTransactionBlock()) {
                ereport(ERROR, (errmsg("CREATE_REPLICATION_SLOT ... USE_SNAPSHOT "
                                       "must be called inside a transaction")));
            }
            if (u_sess->utils_cxt.XactIsoLevel != XACT_REPEATABLE_READ) {
                ereport(ERROR, (errmsg("CREATE_REPLICATION_SLOT ... USE_SNAPSHOT "
                                       "must be called in REPEATABLE READ isolation mode transaction")));
            }
            if (u_sess->utils_cxt.FirstSnapshotSet) {
                ereport(ERROR, (errmsg("CREATE_REPLICATION_SLOT ... USE_SNAPSHOT must be called before any query")));
            }
            if (IsSubTransaction()) {
                ereport(ERROR, (errmsg("CREATE_REPLICATION_SLOT ... USE_SNAPSHOT "
                                       "must not be called in a subtransaction")));
            }
        }
        fullname = expand_dynamic_library_name(cmd->plugin);

        /* Load the shared library, unless we already did */
        (void)internal_load_library(fullname);

        LogicalDecodingContext *ctx = NULL;

        ctx = CreateInitDecodingContext(cmd->plugin, NIL, true, logical_read_xlog_page, WalSndPrepareWrite,
                                        WalSndWriteData);

        /* build initial snapshot, might take a while */
        DecodingContextFindStartpoint(ctx);

        if (!cmd->useSnapshot) {
            /*
             * Export a plain (not of the snapbuild.c type) snapshot to the user
             * that can be imported into another session.
             */
            snapshot_name = SnapBuildExportSnapshot(ctx->snapshot_builder);
        } else {
            /*
             * USE_SNAPSHOT: install the initial snapshot as this
             * transaction's snapshot and remember its CSN for the reply.
             */
            t_thrd.walsender_cxt.isUseSnapshot = true;

            snap = SnapBuildInitialSnapshot(ctx->snapshot_builder);
            SetTransactionSnapshot(snap, NULL, InvalidPid);
            rc = snprintf_s(strCSN, MAX_ULONG_LENGTH, MAX_ULONG_LENGTH - 1, "%lu", snap->snapshotcsn);
            securec_check_ss(rc, "\0", "\0");
        }

        /* don't need the decoding context anymore */
        FreeDecodingContext(ctx);

        ReplicationSlotPersist();

        /* write xlog */
        log_slot_create(&t_thrd.slot_cxt.MyReplicationSlot->data);
    }

    /* text form of the slot's confirmed_flush position for the reply */
    rc = snprintf_s(xpos, sizeof(xpos), sizeof(xpos) - 1, "%X/%X",
                    (uint32)(t_thrd.slot_cxt.MyReplicationSlot->data.confirmed_flush >> 32),
                    (uint32)t_thrd.slot_cxt.MyReplicationSlot->data.confirmed_flush);
    securec_check_ss(rc, "\0", "\0");

    /*
     * It may seem somewhat pointless to send back the same slot name the
     * client just requested and nothing else, but logical replication
     * will add more fields here.  (We could consider removing the slot
     * name from what's sent back, though, since the client has specified
     * that.)
     */
    pq_beginmessage(&buf, 'T');
    if (cmd->useSnapshot) {
        pq_sendint16(&buf, 5); /* 5 fields */
    } else {
        pq_sendint16(&buf, 4); /* 4 fields */
    }

    /* first field: slot name */
    pq_sendstring(&buf, "slot_name"); /* col name */
    pq_sendint32(&buf, 0);            /* table oid */
    pq_sendint16(&buf, 0);            /* attnum */
    pq_sendint32(&buf, TEXTOID);      /* type oid */
    pq_sendint16(&buf, UINT16_MAX);   /* typlen */
    pq_sendint32(&buf, 0);            /* typmod */
    pq_sendint16(&buf, 0);            /* format code */

    /* second field: LSN at which we became consistent */
    pq_sendstring(&buf, "consistent_point"); /* col name */
    pq_sendint32(&buf, 0);                   /* table oid */
    pq_sendint16(&buf, 0);                   /* attnum */
    pq_sendint32(&buf, TEXTOID);             /* type oid */
    pq_sendint16(&buf, UINT16_MAX);          /* typlen */
    pq_sendint32(&buf, 0);                   /* typmod */
    pq_sendint16(&buf, 0);                   /* format code */

    /* third field: exported snapshot's name */
    pq_sendstring(&buf, "snapshot_name"); /* col name */
    pq_sendint32(&buf, 0);                /* table oid */
    pq_sendint16(&buf, 0);                /* attnum */
    pq_sendint32(&buf, TEXTOID);          /* type oid */
    pq_sendint16(&buf, UINT16_MAX);       /* typlen */
    pq_sendint32(&buf, 0);                /* typmod */
    pq_sendint16(&buf, 0);                /* format code */

    /* fourth field: output plugin */
    pq_sendstring(&buf, "output_plugin"); /* col name */
    pq_sendint32(&buf, 0);                /* table oid */
    pq_sendint16(&buf, 0);                /* attnum */
    pq_sendint32(&buf, TEXTOID);          /* type oid */
    pq_sendint16(&buf, UINT16_MAX);       /* typlen */
    pq_sendint32(&buf, 0);                /* typmod */
    pq_sendint16(&buf, 0);                /* format code */

    if (cmd->useSnapshot) {
        /* fifth field: use snapshot's csn */
        pq_sendstring(&buf, "snapshot_csn"); /* col name */
        pq_sendint32(&buf, 0);               /* table oid */
        pq_sendint16(&buf, 0);               /* attnum */
        pq_sendint32(&buf, TEXTOID);         /* type oid */
        pq_sendint16(&buf, UINT16_MAX);      /* typlen */
        pq_sendint32(&buf, 0);               /* typmod */
        pq_sendint16(&buf, 0);               /* format code */
    }
    pq_endmessage_noblock(&buf);

    /* Send a DataRow message */
    pq_beginmessage(&buf, 'D');
    if (cmd->useSnapshot) {
        pq_sendint16(&buf, 5); /* # of columns */
    } else {
        pq_sendint16(&buf, 4); /* # of columns */
    }

    /* slot_name */
    pq_sendint32(&buf, strlen(slot_name)); /* col1 len */
    pq_sendbytes(&buf, slot_name, strlen(slot_name));

    /* consistent wal location */
    pq_sendint32(&buf, strlen(xpos)); /* col2 len */
    pq_sendbytes(&buf, xpos, strlen(xpos));

    /* snapshot name */
    if (snapshot_name != NULL) {
        pq_sendint32(&buf, strlen(snapshot_name)); /* col3 len */
        pq_sendbytes(&buf, snapshot_name, strlen(snapshot_name));
    } else {
        pq_sendint32(&buf, UINT32_MAX); /* col3 len, NULL */
    }

    /* plugin */
    if (cmd->plugin != NULL) {
        pq_sendint32(&buf, strlen(cmd->plugin)); /* col4 len */
        pq_sendbytes(&buf, cmd->plugin, strlen(cmd->plugin));
    } else {
        pq_sendint32(&buf, UINT32_MAX); /* col4 len, NULL */
    }

    /* snapshot csn */
    if (cmd->useSnapshot) {
        pq_sendint32(&buf, strlen(strCSN)); /* col5 len */
        pq_sendbytes(&buf, strCSN, strlen(strCSN));
    }
    pq_endmessage_noblock(&buf);

    /* Send CommandComplete and ReadyForQuery messages */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
    /* ReadyForQuery did pq_flush_if_available for us
     *
     * release active status again, START_REPLICATION will reacquire it
     */
    ReplicationSlotRelease();
}

/* Determine if it is a logical slot */
bool IsLogicalSlot(const char *name)
{
    bool ret = false;

    LWLockAcquire(ReplicationSlotControlLock, LW_SHARED);
    for (int i = 0; i < g_instance.attr.attr_storage.max_replication_slots; i++) {
        ReplicationSlot *s = &t_thrd.slot_cxt.ReplicationSlotCtl->replication_slots[i];

        if (s->in_use && strcmp(name, NameStr(s->data.name)) == 0 && s->data.database != InvalidOid) {
            ret = true;
            break;
        }
    }
    LWLockRelease(ReplicationSlotControlLock);

    return ret;
}

/*
 * Drop a replication slot that is no longer needed.
 *
 * Logical slots take the extra postmaster-state/recovery checks, honour the
 * command's wait flag and have the drop logged via log_slot_drop(); any
 * other slot is dropped with ReplicationSlotDrop()'s default arguments.
 */
static void DropReplicationSlot(DropReplicationSlotCmd *cmd)
{
    const bool logicalSlot = IsLogicalSlot(cmd->slotname);

    if (!logicalSlot) {
        ReplicationSlotDrop(cmd->slotname);
    } else {
        MarkPostmasterChildNormal();
        CheckPMstateAndRecoveryInProgress();
        ReplicationSlotDrop(cmd->slotname, false, !cmd->wait);
        log_slot_drop(cmd->slotname);
    }

    /* two command-completion tags are sent, then ReadyForQuery */
    EndCommand_noblock("DROP_REPLICATION_SLOT", DestRemote);
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());
}

/*
 * Acquire an already created logical slot, set up a decoding context on it
 * and stream decoded changes through WalSndLoop() until the loop returns.
 */
static void StartLogicalReplication(StartReplicationCmd *cmd)
{
    StringInfoData copyBothMsg;

    /* re-verify that logical decoding is still possible for this database */
    CheckLogicalDecodingRequirements(u_sess->proc_cxt.MyDatabaseId);

    Assert(!t_thrd.slot_cxt.MyReplicationSlot);

    const bool forDummyStandby = AmWalSenderToDummyStandby();
    ReplicationSlotAcquire(cmd->slotname, forDummyStandby);

    /*
     * If this is a standby-side sender and recovery has already ended, ask
     * for a disconnect so that the decoding code never has to deal with a
     * switch from recovery to normal operation.  Clients are expected to
     * reconnect on their own.
     */
    const bool promoted = AM_WAL_STANDBY_SENDER && !RecoveryInProgress();
    if (promoted) {
        ereport(LOG, (errmsg("terminating walsender process after promotion")));
        t_thrd.walsender_cxt.walsender_ready_to_stop = true;
    }

    /* make sure the thread runs in the database-walsender role */
    if (!AM_WAL_DB_SENDER) {
        t_thrd.role = WAL_DB_SENDER;
    }

    /* Rebuild snap dir */
    LogicalCleanSnapDirectory(true);

    WalSndSetState(WALSNDSTATE_CATCHUP);

    /* CopyBothResponse (format 0, no columns), flushed immediately */
    pq_beginmessage(&copyBothMsg, 'W');
    pq_sendbyte(&copyBothMsg, 0);
    pq_sendint(&copyBothMsg, 0, 2);
    pq_endmessage(&copyBothMsg);
    pq_flush();

    /*
     * Build the decoding context at the client's requested start point; WAL
     * is then shipped from the last acknowledged position.
     */
    t_thrd.walsender_cxt.logical_decoding_ctx = CreateDecodingContext(cmd->startpoint, cmd->options, false,
                                                                      logical_read_xlog_page, WalSndPrepareWrite,
                                                                      WalSndWriteData);

    ReplicationSlot *mySlot = t_thrd.slot_cxt.MyReplicationSlot;

    /* WAL reading begins at the oldest WAL the slot still requires */
    t_thrd.walsender_cxt.logical_startptr = mySlot->data.restart_lsn;

    /* sentPtr reports the location after which further commits are sent out */
    t_thrd.walsender_cxt.sentPtr = mySlot->data.confirmed_flush;

    /* publish the sent position in shared memory as well */
    volatile WalSnd *shmSnd = t_thrd.walsender_cxt.MyWalSnd; /* volatile prevents code rearrangement */
    SpinLockAcquire(&shmSnd->mutex);
    shmSnd->sentPtr = mySlot->data.restart_lsn;
    SpinLockRelease(&shmSnd->mutex);

    SyncRepInitConfig();

    /* Main loop of walsender */
    WalSndLoop(XLogSendLogical);

    /* streaming is over: drop the decoding context and give the slot back */
    FreeDecodingContext(t_thrd.walsender_cxt.logical_decoding_ctx);
    ReplicationSlotRelease();

    if (t_thrd.walsender_cxt.walsender_ready_to_stop) {
        proc_exit(0);
    }
    WalSndSetState(WALSNDSTATE_STARTUP);

    /* Get out of COPY mode (CommandComplete). */
    EndCommand("COPY 0", DestRemote);
}

/*
 * Load previously initiated logical slot and prepare for sending data in parallel decoding (via WalSndLoop).
 *
 * Remembers the slot name in the thread's walsender context, switches the
 * thread to the database-walsender role, sends CopyBothResponse, creates the
 * parallel decoding context for the dispatcher slot
 * t_thrd.walsender_cxt.LogicalSlot, and then runs the walsender main loop.
 * Once the loop returns, the parallel decoding resources are released.
 */
static void StartParallelLogicalReplication(StartReplicationCmd *cmd)
{
    StringInfoData buf;
    int slotId = t_thrd.walsender_cxt.LogicalSlot;
    size_t slotNameLen = strlen(cmd->slotname);
    if (slotNameLen >= NAMEDATALEN) {
        ereport(ERROR, (errmsg("slotname should be shorter than %d! slotname is %s", NAMEDATALEN, cmd->slotname)));
    }
    /*
     * Copy the terminating NUL as well (slotNameLen + 1 <= NAMEDATALEN is
     * guaranteed by the check above).  Without it, a shorter name copied over
     * a longer one from an earlier command would keep the stale tail.
     */
    errno_t rc = memcpy_s(t_thrd.walsender_cxt.slotname, NAMEDATALEN, cmd->slotname, slotNameLen + 1);
    securec_check(rc, "\0", "\0");

    if (!AM_WAL_DB_SENDER) {
        t_thrd.role = WAL_DB_SENDER;
    }

    /* Send a CopyBothResponse message, and start streaming */
    pq_beginmessage(&buf, 'W');
    pq_sendbyte(&buf, 0);
    pq_sendint(&buf, 0, 2);
    pq_endmessage(&buf);
    pq_flush();
    t_thrd.walsender_cxt.parallel_logical_decoding_ctx = ParallelCreateDecodingContext(cmd->startpoint, cmd->options,
        false, logical_read_xlog_page, slotId);

    /* private state handed to the output side: its own memory context plus a copy of the decode options */
    ParallelDecodingData *data = (ParallelDecodingData *)palloc0(sizeof(ParallelDecodingData));
    data->context = (MemoryContext)AllocSetContextCreate(t_thrd.walsender_cxt.parallel_logical_decoding_ctx->context,
        "restore text conversion context", ALLOCSET_DEFAULT_SIZES);

    rc = memcpy_s(&data->pOptions, sizeof(ParallelDecodeOption), &g_Logicaldispatcher[slotId].pOptions,
        sizeof(ParallelDecodeOption));
    securec_check(rc, "\0", "\0");
    g_Logicaldispatcher[slotId].startpoint = cmd->startpoint;
    t_thrd.walsender_cxt.parallel_logical_decoding_ctx->output_plugin_private = data;

    SyncRepInitConfig();

    /* Main loop of walsender */
    WalSndLoop(XLogSendParallelLogical);

    /* clear the reorder buffer of the slot this thread still holds, if any */
    if (t_thrd.slot_cxt.MyReplicationSlot != NULL) {
        ReorderBufferClear(NameStr(t_thrd.slot_cxt.MyReplicationSlot->data.name));
    }

    ReleaseParallelDecodeResource(slotId);

    if (t_thrd.walsender_cxt.walsender_ready_to_stop) {
        proc_exit(0);
    }
    WalSndSetState(WALSNDSTATE_STARTUP);

    /* Get out of COPY mode (CommandComplete). */
    EndCommand("COPY 0", DestRemote);
}

/*
 * Handle a logical ADVANCE_REPLICATION request on the primary.
 *
 * Moves the named slot's confirmed_flush to cmd->confirmed_flush (capped at
 * the current flush position), raises restart_lsn to cmd->restart_lsn when
 * that is ahead of the stored value, and answers the client with a single
 * row holding the slot name and the confirmed_flush position that was used.
 * Note that cmd->confirmed_flush is modified in place when it gets capped.
 */
static void AdvanceLogicalReplication(AdvanceReplicationCmd *cmd)
{
    StringInfoData msg;
    char lsnText[MAXFNAMELEN];
    int ret = 0;

    if (RecoveryInProgress()) {
        ereport(ERROR, (errcode(ERRCODE_INVALID_OPERATION),
                        errmsg("couldn't advance in recovery")));
    }

    Assert(!t_thrd.slot_cxt.MyReplicationSlot);

    /* The slot must never point past flushed WAL, so cap the requested target. */
    XLogRecPtr flushedUpTo = GetFlushRecPtr();
    if (XLByteLT(flushedUpTo, cmd->confirmed_flush)) {
        cmd->confirmed_flush = flushedUpTo;
    }

    if (XLogRecPtrIsInvalid(cmd->confirmed_flush)) {
        ereport(ERROR, (errcode(ERRCODE_INVALID_PARAMETER_VALUE),
                        errmsg("invalid target wal lsn while advancing "
                               "logical replication restart lsn.")));
    }

    /* Take ownership of the slot for the duration of this command. */
    ReplicationSlotAcquire(cmd->slotname, false);

    Assert(OidIsValid(t_thrd.slot_cxt.MyReplicationSlot->data.database));

    LogicalConfirmReceivedLocation(cmd->confirmed_flush);

    /* restart_lsn is only overwritten when the requested value is ahead of it. */
    volatile ReplicationSlot *mySlot = t_thrd.slot_cxt.MyReplicationSlot;
    if (XLByteLT(mySlot->data.restart_lsn, cmd->restart_lsn)) {
        SpinLockAcquire(&mySlot->mutex);
        mySlot->data.restart_lsn = cmd->restart_lsn;
        SpinLockRelease(&mySlot->mutex);

        /* Write the slot back to disk now that restart_lsn has changed. */
        ReplicationSlotMarkDirty();
        ReplicationSlotSave();
        ReplicationSlotsComputeRequiredLSN(NULL);
    }

    log_slot_advance(&t_thrd.slot_cxt.MyReplicationSlot->data);

    /* High and low 32-bit halves of the (possibly capped) confirmed_flush. */
    const uint32 flushHi = (uint32)(cmd->confirmed_flush >> 32);
    const uint32 flushLo = (uint32)cmd->confirmed_flush;

    if (log_min_messages <= DEBUG2) {
        ereport(LOG, (errmsg("AdvanceLogicalReplication, slotname = %s, restart_lsn = %X/%X, "
                             "confirmed_flush = %X/%X.",
                             cmd->slotname,
                             (uint32)(cmd->restart_lsn >> 32),
                             (uint32)cmd->restart_lsn,
                             flushHi,
                             flushLo)));
    }

    ret = snprintf_s(lsnText, sizeof(lsnText), sizeof(lsnText) - 1, "%X/%X", flushHi, flushLo);
    securec_check_ss(ret, "\0", "\0");

    /* Row description: two text columns. */
    pq_beginmessage(&msg, 'T');
    pq_sendint16(&msg, 2);

    /* column 1: slot_name */
    pq_sendstring(&msg, "slot_name");
    pq_sendint32(&msg, 0);          /* table oid */
    pq_sendint16(&msg, 0);          /* attnum */
    pq_sendint32(&msg, TEXTOID);    /* type oid */
    pq_sendint16(&msg, UINT16_MAX); /* typlen */
    pq_sendint32(&msg, 0);          /* typmod */
    pq_sendint16(&msg, 0);          /* format code */

    /* column 2: confirmed_flush */
    pq_sendstring(&msg, "confirmed_flush");
    pq_sendint32(&msg, 0);          /* table oid */
    pq_sendint16(&msg, 0);          /* attnum */
    pq_sendint32(&msg, TEXTOID);    /* type oid */
    pq_sendint16(&msg, UINT16_MAX); /* typlen */
    pq_sendint32(&msg, 0);          /* typmod */
    pq_sendint16(&msg, 0);          /* format code */
    pq_endmessage_noblock(&msg);

    /* Data row: each value is sent as a length followed by its bytes. */
    const size_t nameLen = strlen(cmd->slotname);
    const size_t lsnLen = strlen(lsnText);

    pq_beginmessage(&msg, 'D');
    pq_sendint16(&msg, 2);
    pq_sendint32(&msg, nameLen);
    pq_sendbytes(&msg, cmd->slotname, nameLen);
    pq_sendint32(&msg, lsnLen);
    pq_sendbytes(&msg, lsnText, lsnLen);
    pq_endmessage_noblock(&msg);

    /* Finish the command; the slot is released only after the reply is queued. */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());

    ReplicationSlotRelease();
}

/*
 * Handle a request to advance the catalog_xmin of a replication slot on the
 * primary.
 *
 * When cmd->catalogXmin is ahead of the slot's stored catalog_xmin, the new
 * value is stored and saved to disk first, and only afterwards copied into
 * effective_catalog_xmin. The client always receives a single row holding
 * the slot name and the requested catalog_xmin rendered as "%X/%X".
 */
static void AdvanceCatalogXmin(AdvanceCatalogXminCmd *cmd)
{
    StringInfoData msg;
    char xminText[MAXFNAMELEN];
    int ret = 0;

    if (RecoveryInProgress()) {
        ereport(ERROR, (errcode(ERRCODE_INVALID_OPERATION),
                        errmsg("couldn't advance in recovery")));
    }

    Assert(!t_thrd.slot_cxt.MyReplicationSlot);

    /* Take ownership of the slot for the duration of this command. */
    ReplicationSlotAcquire(cmd->slotname, false);

    Assert(OidIsValid(t_thrd.slot_cxt.MyReplicationSlot->data.database));

    volatile ReplicationSlot *mySlot = t_thrd.slot_cxt.MyReplicationSlot;
    if (TransactionIdPrecedes(mySlot->data.catalog_xmin, cmd->catalogXmin)) {
        /* Step 1: record the new value in the slot data and drop any candidate. */
        SpinLockAcquire(&mySlot->mutex);
        mySlot->candidate_catalog_xmin = InvalidTransactionId;
        mySlot->data.catalog_xmin = cmd->catalogXmin;
        SpinLockRelease(&mySlot->mutex);

        /* Step 2: write the slot back to disk. */
        ReplicationSlotMarkDirty();
        ReplicationSlotSave();

        /* Step 3: only once it is on disk may the effective value follow. */
        SpinLockAcquire(&mySlot->mutex);
        mySlot->effective_catalog_xmin = mySlot->data.catalog_xmin;
        SpinLockRelease(&mySlot->mutex);
        ReplicationSlotsComputeRequiredXmin(false);
        log_slot_advance(&t_thrd.slot_cxt.MyReplicationSlot->data);
    }

    ret = snprintf_s(xminText, sizeof(xminText), sizeof(xminText) - 1, "%X/%X",
                     (uint32)(cmd->catalogXmin >> 32), (uint32)cmd->catalogXmin);
    securec_check_ss(ret, "\0", "\0");

    /* Row description: two text columns. */
    pq_beginmessage(&msg, 'T');
    pq_sendint16(&msg, 2);

    /* column 1: slot_name */
    pq_sendstring(&msg, "slot_name");
    pq_sendint32(&msg, 0);          /* table oid */
    pq_sendint16(&msg, 0);          /* attnum */
    pq_sendint32(&msg, TEXTOID);    /* type oid */
    pq_sendint16(&msg, UINT16_MAX); /* typlen */
    pq_sendint32(&msg, 0);          /* typmod */
    pq_sendint16(&msg, 0);          /* format code */

    /* column 2: catalog_xmin */
    pq_sendstring(&msg, "catalog_xmin");
    pq_sendint32(&msg, 0);          /* table oid */
    pq_sendint16(&msg, 0);          /* attnum */
    pq_sendint32(&msg, TEXTOID);    /* type oid */
    pq_sendint16(&msg, UINT16_MAX); /* typlen */
    pq_sendint32(&msg, 0);          /* typmod */
    pq_sendint16(&msg, 0);          /* format code */
    pq_endmessage_noblock(&msg);

    /* Data row: each value is sent as a length followed by its bytes. */
    const size_t nameLen = strlen(cmd->slotname);
    const size_t xminLen = strlen(xminText);

    pq_beginmessage(&msg, 'D');
    pq_sendint16(&msg, 2);
    pq_sendint32(&msg, nameLen);
    pq_sendbytes(&msg, cmd->slotname, nameLen);
    pq_sendint32(&msg, xminLen);
    pq_sendbytes(&msg, xminText, xminLen);
    pq_endmessage_noblock(&msg);

    /* Finish the command; the slot is released only after the reply is queued. */
    EndCommand_noblock("SELECT", DestRemote);
    ReadyForQuery_noblock(DestRemote, WalSndTimeout());

    ReplicationSlotRelease();
}

/*
 * Start a fresh 'w' message in a StringInfo.
 *
 * The buffer is reset and filled with the message header: the type byte,
 * dataStart, walEnd and a zeroed placeholder for the send time. Nothing
 * lasting should happen here, since the prepared data may never be sent.
 * The xid argument is not used.
 */
void WalSndPrepareWriteHelper(StringInfo out, XLogRecPtr lsn, TransactionId xid, bool last_write)
{
    /*
     * Only the last write carries the real LSN; sending the same LSN several
     * times would confuse sync rep, so earlier writes get an invalid one.
     */
    const XLogRecPtr headerLsn = last_write ? lsn : InvalidXLogRecPtr;

    resetStringInfo(out);
    pq_sendbyte(out, 'w');
    pq_sendint64(out, headerLsn); /* dataStart */
    pq_sendint64(out, headerLsn); /* walEnd */

    /* Space for the send time is reserved now; the value is filled in later. */
    pq_sendint64(out, 0);
}
/*
 * 'prepare_write' callback for a LogicalDecodingContext: prepares the
 * context's output buffer through WalSndPrepareWriteHelper.
 */
static void WalSndPrepareWrite(LogicalDecodingContext *ctx, XLogRecPtr lsn, TransactionId xid, bool last_write)
{
    StringInfo target = ctx->out;

    WalSndPrepareWriteHelper(target, lsn, xid, last_write);
}

/*
 * Actually write out data previously prepared by WalSndPrepareWriteHelper to
 * the network. Take as long as needed, but process replies from the other
 * side and check timeouts during that.
 *
 * out - message buffer whose header already reserves room for the send time
 *       (type byte + dataStart + walEnd + sendtime); the send time is
 *       patched in here just before the buffer is queued.
 * lsn, xid, last_write - not used by this function.
 */
void WalSndWriteDataHelper(StringInfo out, XLogRecPtr lsn, TransactionId xid, bool last_write)
{
    /* Offset of the sendtime field: type byte, then dataStart and walEnd. */
    const size_t sendtimeOffset = 1 + sizeof(int64) + sizeof(int64);
    size_t sendtimeRoom;
    errno_t rc;

    /*
     * Fill the send timestamp last, so that it is taken as late as
     * possible. This is somewhat ugly, but the protocol's set as it's already
     * used for several releases by streaming physical replication.
     */
    resetStringInfo(t_thrd.walsender_cxt.tmpbuf);
    pq_sendint64(t_thrd.walsender_cxt.tmpbuf, GetCurrentTimestamp());

    /*
     * The destination starts sendtimeOffset bytes into the buffer, so the
     * room left for the copy is out->len minus that offset, not out->len.
     * A buffer too short to hold the field yields room 0 and memcpy_s fails.
     */
    sendtimeRoom = (out->len > (int)sendtimeOffset) ? ((size_t)out->len - sendtimeOffset) : 0;
    rc = memcpy_s(out->data + sendtimeOffset, sendtimeRoom, t_thrd.walsender_cxt.tmpbuf->data, sizeof(int64));
    securec_check(rc, "\0", "\0");

    /* output previously gathered data in a CopyData packet */
    pq_putmessage_noblock('d', out->data, out->len);

    CHECK_FOR_INTERRUPTS();

    /* fast path */
    /* Try to flush pending output to the client */
    if (pq_flush_if_writable() != 0)
        WalSndShutdown();

    if (!pq_is_send_pending())
        return;

    /* Slow path: keep servicing the connection until everything is flushed. */
    for (;;) {
        int wakeEvents;
        long sleeptime;
        TimestampTz now;

        /*
         * Emergency bailout if postmaster has died.  This is to avoid the
         * necessity for manual cleanup of all postmaster children.
         */
        if (!PostmasterIsAlive())
            proc_exit(1);

        /* Process any requests or signals received recently */
        if (t_thrd.walsender_cxt.got_SIGHUP) {
            t_thrd.walsender_cxt.got_SIGHUP = false;
            ProcessConfigFile(PGC_SIGHUP);
            SyncRepInitConfig();
        }

        /* Check for input from the client */
        ProcessRepliesIfAny();

        /* Clear any already-pending wakeups */
        ResetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);

        /* Try to flush pending output to the client */
        if (pq_flush_if_writable() != 0)
            WalSndShutdown();

        /* If we finished clearing the buffered data, we're done here. */
        if (!pq_is_send_pending())
            break;

        now = GetCurrentTimestamp();

        sleeptime = WalSndComputeSleeptime(now);

        wakeEvents = WL_LATCH_SET | WL_POSTMASTER_DEATH | WL_SOCKET_WRITEABLE | WL_SOCKET_READABLE | WL_TIMEOUT;

        /* Sleep until something happens or we time out */
        t_thrd.int_cxt.ImmediateInterruptOK = true;
        CHECK_FOR_INTERRUPTS();
        WaitLatchOrSocket(&t_thrd.walsender_cxt.MyWalSnd->latch, wakeEvents, u_sess->proc_cxt.MyProcPort->sock,
                          sleeptime);
        t_thrd.int_cxt.ImmediateInterruptOK = false;
    }

    /* reactivate latch so WalSndLoop knows to continue */
    SetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
}

/*
 * 'write' callback for a LogicalDecodingContext: sends the context's output
 * buffer through WalSndWriteDataHelper.
 */
static void WalSndWriteData(LogicalDecodingContext *ctx, XLogRecPtr lsn, TransactionId xid, bool last_write)
{
    StringInfo pending = ctx->out;

    WalSndWriteDataHelper(pending, lsn, xid, last_write);
}

/*
 * One round of walsender housekeeping while waiting for WAL.
 *
 * Re-reads the configuration after SIGHUP, drains client replies and resets
 * the latch (both skipped when AM_LOGICAL_READ_RECORD is set), and finally
 * stores the current flush position - or the replay position while in
 * recovery - into *RecentFlushPoint.
 */
static void WalSndHandleMessage(XLogRecPtr *RecentFlushPoint)
{
    /* A pending SIGHUP means the configuration has to be reloaded. */
    if (t_thrd.walsender_cxt.got_SIGHUP) {
        t_thrd.walsender_cxt.got_SIGHUP = false;
        ProcessConfigFile(PGC_SIGHUP);
        SyncRepInitConfig();
    }

    if (!AM_LOGICAL_READ_RECORD) {
        /* Consume whatever the client has sent, then clear pending wakeups. */
        ProcessRepliesIfAny();
        ResetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
    }

    /* Refresh the caller's idea of how far WAL can safely be read. */
    *RecentFlushPoint = RecoveryInProgress() ? GetXLogReplayRecPtr(NULL) : GetFlushRecPtr();
}

/*
 * Wait till WAL < loc is flushed to disk so it can be safely read.
 *
 * Returns the most recently observed flush pointer (the replay pointer while
 * in recovery). The returned value can still be behind loc when the loop was
 * left because walsender_ready_to_stop is set.
 *
 * When AM_LOGICAL_READ_RECORD is set, this function does not send keepalives,
 * does not wait on the latch or the client socket (it sleeps 10 ms per
 * iteration instead) and does not set the latch on exit.
 */
static XLogRecPtr WalSndWaitForWal(XLogRecPtr loc)
{
    int wakeEvents;
    /*
     * Cached across calls so the fast path below can skip the lookup.
     * NOTE(review): being function-static, this cache is shared by every
     * caller in the process - confirm that is intended if several walsenders
     * can run inside one process.
     */
    static XLogRecPtr RecentFlushPtr = InvalidXLogRecPtr;

    /*
     * Fast path to avoid acquiring the spinlock in case we already know we
     * have enough WAL available. This is particularly interesting if we're
     * far behind.
     */
    if (!XLogRecPtrIsInvalid(RecentFlushPtr) && XLByteLE(loc, RecentFlushPtr))
        return RecentFlushPtr;

    /* Get a more recent flush pointer. */
    if (!RecoveryInProgress())
        RecentFlushPtr = GetFlushRecPtr();
    else
        RecentFlushPtr = GetXLogReplayRecPtr(NULL);

    for (;;) {
        long sleeptime;
        TimestampTz now;

        /*
         * Emergency bailout if postmaster has died.  This is to avoid the
         * necessity for manual cleanup of all postmaster children.
         * NOTE(review): this calls exit(1) while WalSndWriteDataHelper uses
         * proc_exit(1) for the same situation - confirm the difference is
         * deliberate.
         */
        if (!PostmasterIsAlive())
            exit(1);

        /* Reload config if signalled, drain replies, refresh RecentFlushPtr. */
        WalSndHandleMessage(&RecentFlushPtr);

        /*
         * If postmaster asked us to stop, don't wait here anymore. This will
         * cause the xlogreader to return without reading a full record, which
         * is the fastest way to reach the mainloop which then can quit.
         *
         * It's important to do this check after the recomputation of
         * RecentFlushPtr, so we can send all remaining data before shutting
         * down.
         */
        if (t_thrd.walsender_cxt.walsender_ready_to_stop)
            break;

        /*
         * We only send regular messages to the client for full decoded
         * transactions, but a synchronous replication and walsender shutdown
         * possibly are waiting for a later location. So we send pings
         * containing the flush location every now and then.
         */
        if (!AM_LOGICAL_READ_RECORD) {
            if (XLByteLT(t_thrd.walsender_cxt.MyWalSnd->flush, t_thrd.walsender_cxt.sentPtr) &&
                !t_thrd.walsender_cxt.waiting_for_ping_response) {
                WalSndKeepalive(false);
            }
        }

        /* check whether we're done */
        if (XLByteLE(loc, RecentFlushPtr))
            break;

        /* Waiting for new WAL. Since we need to wait, we're now caught up. */
        t_thrd.walsender_cxt.walSndCaughtUp = true;

        /*
         * Try to flush pending output to the client. Also wait for the socket
         * becoming writable, if there's still pending output after an attempt
         * to flush. Otherwise we might just sit on output data while waiting
         * for new WAL being generated.
         *
         * A failed flush or a requested logical-worker shutdown both end in
         * WalSndShutdown().
         */
        if (pq_flush_if_writable() != 0 || IsLogicalWorkerShutdownRequested())
            WalSndShutdown();

        now = GetCurrentTimestamp();

        sleeptime = WalSndComputeSleeptime(now);

        wakeEvents = WL_LATCH_SET | WL_POSTMASTER_DEATH | WL_SOCKET_READABLE | WL_TIMEOUT;

        /* Only wait for writability when there is still output queued. */
        if (pq_is_send_pending())
            wakeEvents |= WL_SOCKET_WRITEABLE;

        /* Sleep until something happens or we time out */
        t_thrd.int_cxt.ImmediateInterruptOK = true;
        CHECK_FOR_INTERRUPTS();
        if (!AM_LOGICAL_READ_RECORD) {
            WaitLatchOrSocket(&t_thrd.walsender_cxt.MyWalSnd->latch, wakeEvents, u_sess->proc_cxt.MyProcPort->sock,
                              sleeptime);
        } else if (!XLByteLE(loc, RecentFlushPtr)) {
            /* No latch/socket wait in this mode: poll again after 10 ms. */
            pg_usleep(10000L);
        }
        t_thrd.int_cxt.ImmediateInterruptOK = false;
    }

    /* reactivate latch so WalSndLoop knows to continue */
    if (!AM_LOGICAL_READ_RECORD) {
        SetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
    }
    return RecentFlushPtr;
}

/*
 * Check cmdString format.
 *
 * Scans the command for double quotes, single quotes and parentheses and
 * verifies that they pair up, using a small fixed-size stack:
 *   - a quote character closes the stack top when the top is the same quote
 *     character, otherwise it is pushed;
 *   - '(' is always pushed;
 *   - ')' must find '(' on top of the stack.
 *
 * Returns true when every delimiter has been closed at the end of the string.
 * Returns false on a mismatch, on unclosed delimiters, or when more than
 * maxStack delimiters are open at once (such input is rejected instead of
 * being written past the end of the stack).
 */
bool cmdStringCheck(const char *cmd_string)
{
    const int maxStack = 100;
    char charStack[maxStack];
    int stackLen = 0;
    for (int i = 0; cmd_string[i] != '\0'; i++) {
        const char cur = cmd_string[i];

        if (cur == '\"' || cur == '\'') {
            /* The same quote character on top of the stack closes the pair. */
            if (stackLen > 0 && charStack[stackLen - 1] == cur) {
                stackLen--;
                continue;
            }
        } else if (cur == ')') {
            if (stackLen > 0 && charStack[stackLen - 1] == '(') {
                stackLen--;
                continue;
            }
            return false;
        } else if (cur != '(') {
            /* Ordinary character, nothing to track. */
            continue;
        }

        /* Opening delimiter: refuse input that nests deeper than the stack. */
        if (stackLen >= maxStack) {
            return false;
        }
        charStack[stackLen++] = cur;
    }
    return stackLen == 0;
}

/*
 * Check cmdString length.
 *
 * Looks for the slot name in the commands that carry one
 *   START_REPLICATION SLOT <name> ...
 *   CREATE_REPLICATION_SLOT <name> ...
 *   DROP_REPLICATION_SLOT <name> ...
 *   ADVANCE_REPLICATION SLOT <name> ...
 * and returns false when that name, without a surrounding pair of double
 * quotes, is slotname_limit characters or longer. Every other input,
 * including NULL and the empty string, returns true. Only the first
 * cmd_length_limit - 1 bytes of the command are examined, and tokens are
 * split on spaces only.
 */
static bool cmdStringLengthCheck(const char* cmd_string)
{
    const size_t cmd_length_limit = 1024;
    const size_t slotname_limit = 64;
    char comd[cmd_length_limit] = {'\0'};
    char* sub_cmd = NULL;
    char* rm_cmd = NULL;
    char* slot_name = NULL;

    if (cmd_string == NULL) {
        return true;
    }
    size_t cmd_length = strlen(cmd_string);
    if (cmd_length == 0) {
        return true;
    }

    /* strtok_r modifies its input, so tokenize a bounded private copy. */
    errno_t ret = memset_s(comd, cmd_length_limit, 0, cmd_length_limit);
    securec_check_c(ret, "\0", "\0");
    ret = strncpy_s(comd, cmd_length_limit, cmd_string, Min(cmd_length, cmd_length_limit - 1));
    securec_check_c(ret, "\0", "\0");

    if (cmd_length > strlen("START_REPLICATION") &&
        strncmp(cmd_string, "START_REPLICATION", strlen("START_REPLICATION")) == 0) {
        /* The slot name is only present when the second token is SLOT. */
        sub_cmd = strtok_r(comd, " ", &rm_cmd);
        sub_cmd = strtok_r(NULL, " ", &rm_cmd);
        if (sub_cmd == NULL || strlen(sub_cmd) != strlen("SLOT") ||
            strncmp(sub_cmd, "SLOT", strlen("SLOT")) != 0) {
            return true;
        }
    } else if (cmd_length > strlen("CREATE_REPLICATION_SLOT") &&
        strncmp(cmd_string, "CREATE_REPLICATION_SLOT", strlen("CREATE_REPLICATION_SLOT")) == 0) {
        sub_cmd = strtok_r(comd, " ", &rm_cmd);
    } else if (cmd_length > strlen("DROP_REPLICATION_SLOT") &&
        strncmp(cmd_string, "DROP_REPLICATION_SLOT", strlen("DROP_REPLICATION_SLOT")) == 0) {
        sub_cmd = strtok_r(comd, " ", &rm_cmd);
    /* ADVANCE_REPLICATION SLOT slotname LOGICAL %X/%X */
    } else if (cmd_length > strlen("ADVANCE_REPLICATION") &&
        strncmp(cmd_string, "ADVANCE_REPLICATION", strlen("ADVANCE_REPLICATION")) == 0) {
        sub_cmd = strtok_r(comd, " ", &rm_cmd);
        sub_cmd = strtok_r(NULL, " ", &rm_cmd);
        if (sub_cmd == NULL || strlen(sub_cmd) != strlen("SLOT") ||
            strncmp(sub_cmd, "SLOT", strlen("SLOT")) != 0) {
            return true;
        }
    } else {
        /* Not a command that names a slot. */
        return true;
    }

    /* The token that follows is the slot name. */
    slot_name = strtok_r(NULL, " ", &rm_cmd);
    if (slot_name == NULL) {
        return true;
    }

    /*
     * If slot_name is wrapped in "", its length should minus 2. At least two
     * characters are required for that: a token consisting of one lone quote
     * would otherwise make the unsigned length wrap around and be reported
     * as too long.
     */
    size_t slot_name_len = strlen(slot_name);
    if (slot_name_len >= 2 && slot_name[0] == '"' && slot_name[slot_name_len - 1] == '"') {
        slot_name_len -= 2;
    }
    if (slot_name_len >= slotname_limit) {
        return false;
    }
    return true;
}

/*
 * Report whether a logical replication slot with the given name exists.
 *
 * Walks all max_replication_slots entries and returns true for the first
 * one that is in use, has a valid database OID and carries the name
 * slotName. Entries that are not in use are skipped so that leftover data
 * in such an entry cannot produce a match.
 *
 * NOTE(review): the slot array is read without taking any lock here -
 * confirm callers tolerate a concurrent create/drop.
 */
bool isLogicalSlotExist(char* slotName)
{
    for (int slotno = 0; slotno < g_instance.attr.attr_storage.max_replication_slots; slotno++) {
        ReplicationSlot *slot = &t_thrd.slot_cxt.ReplicationSlotCtl->replication_slots[slotno];
        if (!slot->in_use) {
            continue;
        }
        if (slot->data.database != InvalidOid &&
            strcmp(slotName, slot->data.name.data) == 0) {
            return true;
        }
    }
    return false;
}

/*
 * Dispatch one parsed replication command to its handler.
 *
 * cmd_node   - parse result; its node type selects the handler
 * repCxt     - per-connection flags updated here: messageReceiveNoTimeout is
 *              set after the advance commands, replicationStarted after a
 *              physical START_REPLICATION returns
 * cmd_string - original command text, used for SQL commands and in the
 *              error raised for an unknown node type
 *
 * CurrentResourceOwner is saved on entry and put back after the handler
 * returns. An unrecognized node type is reported with FATAL.
 */
static void IdentifyCommand(Node* cmd_node, ReplicationCxt* repCxt, const char *cmd_string){
    ResourceOwner tmpOwner = t_thrd.utils_cxt.CurrentResourceOwner;
    Assert(tmpOwner != NULL);
    switch (cmd_node->type) {
        case T_AdvanceCatalogXminCmd: {
            AdvanceCatalogXminCmd *cmd = (AdvanceCatalogXminCmd *)cmd_node;
            AdvanceCatalogXmin(cmd);
            /* Flag the connection so message receive does not time out. */
            repCxt->messageReceiveNoTimeout = true;
            break;
        }

        case T_IdentifySystemCmd:
            IdentifySystem();
            break;

        case T_IdentifyVersionCmd:
            IdentifyVersion();
            break;

        case T_IdentifyModeCmd:
            IdentifyMode();
            break;

        case T_IdentifyMaxLsnCmd:
            IdentifyMaxLsn();
            break;

        case T_IdentifyConsistenceCmd:
            IdentifyConsistence((IdentifyConsistenceCmd *)cmd_node);
            SetReplWalSender();
            break;

        case T_IdentifyChannelCmd:
            IdentifyChannel((IdentifyChannelCmd *)cmd_node);
            break;

#ifndef ENABLE_MULTIPLE_NODES
        case T_IdentifyAZCmd:
            IdentifyAvailableZone();
            break;
#endif
        case T_BaseBackupCmd:
            /* Mark the peer as a standby that is being built before sending the backup. */
            MarkPostmasterChildNormal();
            SetWalSndPeerMode(STANDBY_MODE);
            SetWalSndPeerDbstate(BUILDING_STATE);

            if (!IS_PGXC_COORDINATOR && IS_DN_DUMMY_STANDYS_MODE())
                StopAliveBuildSender();
            SendBaseBackup((BaseBackupCmd *)cmd_node);

            /* Send CommandComplete and ReadyForQuery messages */
            EndCommand_noblock("SELECT", DestRemote);
            ReadyForQuery_noblock(DestRemote, u_sess->attr.attr_storage.basebackup_timeout * MILLISECONDS_PER_SECONDS);
            /* ReadyForQuery did pq_flush for us */
            /* Audit database recovery */
            pgaudit_system_recovery_ok();
            break;

        case T_CreateReplicationSlotCmd:
            CreateReplicationSlot((CreateReplicationSlotCmd *)cmd_node);
            break;

        case T_DropReplicationSlotCmd:
            DropReplicationSlot((DropReplicationSlotCmd *)cmd_node);
            break;

        case T_StartReplicationCmd: {
            StartReplicationCmd *cmd = (StartReplicationCmd *)cmd_node;
            /* Parsed up front for every kind, but only consulted for logical replication. */
            int parallelDecodeNum = ParseParallelDecodeNumOnly(cmd->options);
            if (cmd->kind == REPLICATION_KIND_PHYSICAL) {
                StartReplication(cmd);
                /* Tell the caller that replication has started. */
                repCxt->replicationStarted = true;
            } else if (t_thrd.proc->workingVersionNum >= PARALLEL_DECODE_VERSION_NUM && parallelDecodeNum > 1) {
                /* Parallel logical decoding: refuse with an ERROR if no such logical slot exists. */
                if (!isLogicalSlotExist(cmd->slotname)) {
                    ereport(ERROR, (errmodule(MOD_LOGICAL_DECODE), errcode(ERRCODE_LOG),
                        errmsg("Invalid logical replication slot %s.", cmd->slotname), errdetail("N/A"),
                        errcause("Replication slot does not exist."),
                        erraction("Create the replication slot first.")));
                }
                StartLogicalLogWorkers(u_sess->proc_cxt.MyProcPort->user_name,
                    u_sess->proc_cxt.MyProcPort->database_name, cmd->slotname, cmd->options, parallelDecodeNum);
                MarkPostmasterChildNormal();
                StartParallelLogicalReplication(cmd);
            } else {
                /* Non-parallel logical decoding. */
                MarkPostmasterChildNormal();
                StartLogicalReplication(cmd);
            }
            break;
        }

        case T_AdvanceReplicationCmd: {
            AdvanceReplicationCmd *cmd = (AdvanceReplicationCmd *)cmd_node;
            /* Only the logical kind is acted upon; any other kind is ignored here. */
            if (cmd->kind == REPLICATION_KIND_LOGICAL) {
                AdvanceLogicalReplication(cmd);
                /*
                 * This connection is used to notify primary to advance logical replication slot,
                 * and we don't want it to time out and disconnect.
                 */
                repCxt->messageReceiveNoTimeout = true;
            }
            break;
        }

#ifdef ENABLE_MOT
        case T_FetchMotCheckpointCmd:
            PerformMotCheckpointFetch();
            /* Send CommandComplete and ReadyForQuery messages */
            EndCommand_noblock("SELECT", DestRemote);
            ReadyForQuery_noblock(DestRemote, WalSndTimeout());
            break;
#endif

        case T_SQLCmd:
            /* Plain SQL requires a connection that is bound to a database. */
            if (u_sess->proc_cxt.MyDatabaseId == InvalidOid)
                ereport(ERROR, (errmsg("not connected to database")));
            execute_simple_query(cmd_string);
            /* Send the ReadyForQuery message */
            ReadyForQuery((CommandDest)t_thrd.postgres_cxt.whereToSendOutput);
            break;

        default:
            ereport(FATAL,
                    (errcode(ERRCODE_PROTOCOL_VIOLATION), errmsg("invalid standby query string: %s", cmd_string)));
    }
    /* Put back the resource owner that was current on entry. */
    t_thrd.utils_cxt.CurrentResourceOwner = tmpOwner;
}

/*
 * Execute an incoming replication command.
 */
static void HandleWalReplicationCommand(const char *cmd_string, ReplicationCxt* repCxt)
{
    int parse_rc;
    Node *cmd_node = NULL;
    MemoryContext cmd_context;
    MemoryContext old_context;
    replication_scanner_yyscan_t yyscanner = NULL;

    /*
     * CREATE_REPLICATION_SLOT ... LOGICAL exports a snapshot until the next
     * command arrives. Clean up the old stuff if there's anything.
     */
    SnapBuildClearExportedSnapshot();

    ereport(LOG, (errmsg("received wal replication command: %s", cmd_string)));

    if (cmdStringCheck(cmd_string) == false) {
        ereport(ERROR, (errcode(ERRCODE_SYNTAX_ERROR), (errmsg_internal("replication command, syntax error."))));
    }

    if (cmdStringLengthCheck(cmd_string) == false) {
        ereport(ERROR, (errcode(ERRCODE_SYNTAX_ERROR),
            (errmsg_internal("replication slot name should be shorter than %d.", NAMEDATALEN))));
    }

    cmd_context = AllocSetContextCreate(CurrentMemoryContext, "Replication command context", ALLOCSET_DEFAULT_MINSIZE,
                                        ALLOCSET_DEFAULT_INITSIZE, ALLOCSET_DEFAULT_MAXSIZE);
    old_context = MemoryContextSwitchTo(cmd_context);

    yyscanner = replication_scanner_init(cmd_string);
    parse_rc = replication_yyparse(yyscanner);
    replication_scanner_finish(yyscanner);

    if (parse_rc != 0) {
        ereport(ERROR,
                (errcode(ERRCODE_SYNTAX_ERROR), (errmsg_internal("replication command parser returned %d", parse_rc))));
    }

    cmd_node = t_thrd.replgram_cxt.replication_parse_result;

    /*
     * CREATE_REPLICATION_SLOT ... LOGICAL exports a snapshot. If it was
     * called outside of transaction the snapshot should be cleared here.
     */
    if (!IsTransactionBlock())
        SnapBuildClearExportedSnapshot();

    /*
     * For aborted transactions, don't allow anything except pure SQL,
     * the exec_simple_query() will handle it correctly.
     */
    if (IsAbortedTransactionBlockState() && !IsA(cmd_node, SQLCmd))
        ereport(ERROR, (errcode(ERRCODE_IN_FAILED_SQL_TRANSACTION), errmsg("current transaction is aborted, "
            "commands ignored until end of transaction block")));

    CHECK_FOR_INTERRUPTS();

    IdentifyCommand(cmd_node, repCxt, cmd_string);

    /* done */
    (void)MemoryContextSwitchTo(old_context);
    MemoryContextDelete(cmd_context);
}

/*
 * Consume everything the remote end has sent so far, without blocking.
 *
 * Standby replies ('d') are processed; 'c' and 'X' end this walsender, as
 * does EOF or a read error; any other message type is a FATAL protocol
 * violation. When no reply was received in this call, the replication
 * timeout is checked and a keepalive is sent if one is due.
 */
static void ProcessRepliesIfAny(void)
{
    unsigned char msgKind;
    int avail;
    bool gotReply = false;

    /* A result of 0 means nothing more can be read without blocking. */
    while ((avail = pq_getbyte_if_available(&msgKind)) != 0) {
        if (avail < 0) {
            /* unexpected error or EOF */
            ereport(COMMERROR, (errcode(ERRCODE_PROTOCOL_VIOLATION), errmsg("unexpected EOF on standby connection")));
            proc_exit(0);
        }

        /* Only a very small set of message types is expected in this phase. */
        switch (msgKind) {
            case 'd':
                /* a standby reply wrapped in a CopyData packet */
                ProcessStandbyMessage();
                gotReply = true;
                break;

            case 'c':
            case 'X':
                /* the standby is closing down: exit quietly */
                proc_exit(0);
                /* fall-through */
            default:
                ereport(FATAL, (errcode(ERRCODE_PROTOCOL_VIOLATION),
                                errmsg("invalid standby message type \"%c\"", msgKind)));
        }
    }

    if (!gotReply) {
        /* Nothing arrived: enforce the timeout and ping the peer when due. */
        TimestampTz now = GetCurrentTimestamp();
        WalSndCheckTimeOut(now);
        WalSndKeepaliveIfNecessary(now);
        return;
    }

    /* At least one reply came in: remember when, and stop waiting for a ping answer. */
    t_thrd.walsender_cxt.last_reply_timestamp = GetCurrentTimestamp();
    t_thrd.walsender_cxt.waiting_for_ping_response = false;
}

/*
 * Process a status update message received from standby.
 */
static void ProcessStandbyMessage(void)
{
    char msgtype;

    resetStringInfo(t_thrd.walsender_cxt.reply_message);

    /*
     * Read the message contents.
     */
    if (pq_getmessage(t_thrd.walsender_cxt.reply_message, 0)) {
        ereport(COMMERROR, (errcode(ERRCODE_PROTOCOL_VIOLATION), errmsg("unexpected EOF on standby connection")));
        proc_exit(0);
    }

    /*
     * Check message type from the first byte.
     */
    msgtype = pq_getmsgbyte(t_thrd.walsender_cxt.reply_message);

    switch (msgtype) {
        case 'r':
            ProcessStandbyReplyMessage();
            break;

        case 'h':
            ProcessStandbyHSFeedbackMessage();
            break;

        case 's':
            ProcessStandbySwitchRequestMessage();
            break;

        case 'A':
            ProcessStandbyFileTimeMessage();
            break;

        case 'a':
            ProcessArchiveFeedbackMessage();
            break;

        case 'S':
            ProcessHadrSwitchoverMessage();
            break;

        case 'R':
            ProcessHadrReplyMessage();
            break;

        case 'b':
            SendPostmasterSignal(PMSIGNAL_SWITCHOVER_TIMEOUT);
            break;

        default:
            ereport(COMMERROR,
                    (errcode(ERRCODE_PROTOCOL_VIOLATION), errmsg("unexpected message type \"%d\"", msgtype)));
            proc_exit(0);
    }
}

/*
 * Record that a walreceiver confirmed receipt of WAL up to `lsn` by storing
 * it as restart_lsn of the slot owned by this thread. An lsn that falls
 * exactly on a segment boundary is ignored.
 */
static void PhysicalConfirmReceivedLocation(XLogRecPtr lsn)
{
    /* volatile pointer keeps the accesses from being rearranged */
    volatile ReplicationSlot *mySlot = t_thrd.slot_cxt.MyReplicationSlot;
    bool moved = false;

    Assert(!XLByteEQ(lsn, InvalidXLogRecPtr));

    /* no update on a segment boundary */
    if (lsn % XLogSegSize == 0) {
        return;
    }

    SpinLockAcquire(&mySlot->mutex);
    moved = !XLByteEQ(mySlot->data.restart_lsn, lsn);
    if (moved) {
        mySlot->data.restart_lsn = lsn;
    }
    SpinLockRelease(&mySlot->mutex);

    if (!moved) {
        return;
    }

    /*
     * The slot is only marked dirty, not saved. Losing this update merely
     * makes file removal more conservative and may show stale information
     * in a statistics view, so an immediate write is not worth its cost.
     */
    ReplicationSlotMarkDirty();
    ReplicationSlotsComputeRequiredLSN(NULL);
}

/*
 * Regular request from standby to send config file.
 *
 * The standby reports the modification time of its copy of the config file.
 * It is compared with the modification time of the local file
 * (walsender_cxt.gucconf_file); when they differ the file is sent.
 *
 * A failing lstat() raises an ERROR unless the file simply does not exist.
 * In that case there is nothing to compare or to send, so the request is
 * logged and skipped - the stat buffer is not filled in on failure and must
 * not be read.
 */
static void ProcessStandbyFileTimeMessage(void)
{
    ConfigModifyTimeMessage reply_modify_file_time;
    struct stat statbuf;

    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char *)&reply_modify_file_time,
                    sizeof(ConfigModifyTimeMessage));
    if (lstat(t_thrd.walsender_cxt.gucconf_file, &statbuf) != 0) {
        if (errno != ENOENT) {
            ereport(ERROR, (errcode_for_file_access(),
                            errmsg("could not stat file or directory \"%s\": %m", t_thrd.walsender_cxt.gucconf_file)));
        }
        ereport(LOG, (errmsg("the config file \"%s\" does not exist, so nothing is sent to the standby",
                             t_thrd.walsender_cxt.gucconf_file)));
        return;
    }

    if (reply_modify_file_time.config_modify_time != statbuf.st_mtime) {
        ereport(LOG, (errmsg("the config file has been modified, so send it to the standby")));
        (void)SendConfigFile(t_thrd.walsender_cxt.gucconf_file);
    } else {
        ereport(LOG, (errmsg("the config file has no change")));
    }
}

/*
 * Map a SNDROLE_* value to its display name.
 * Any value without a dedicated name yields "UNKNOW".
 */
char *remote_role_to_string(int role)
{
    switch (role) {
        case SNDROLE_PRIMARY_STANDBY:
            return "STANDBY";
        case SNDROLE_PRIMARY_BUILDSTANDBY:
            return "BUILD_STANDBY";
        case SNDROLE_PRIMARY_DUMMYSTANDBY:
            return "DUMMYSTANDBY";
        case SNDROLE_DUMMYSTANDBY_STANDBY:
            return "DSTANDBY";
        default:
            return "UNKNOW";
    }
}

/*
 * When flush_lsn exceeds min_restart_lsn by a margin of max_keep_log_seg,
 * walsender stream limitation is triggered.
 */
static bool LogicalSlotSleepFlag(void)
{
    const int xlog_offset = 24;
    const int sleep_time_unit = 100000;
    int64 max_keep_log_seg = (int64)g_instance.attr.attr_storage.max_keep_log_seg;
    if (max_keep_log_seg <= 0) {
        return false;
    }
    XLogRecPtr min_restart_lsn = InvalidXLogRecPtr;
    for (int i = 0; i < g_instance.attr.attr_storage.max_replication_slots; i++) {
        ReplicationSlot *s = &t_thrd.slot_cxt.ReplicationSlotCtl->replication_slots[i];

        if (s->in_use && s->data.database != InvalidOid) {
            min_restart_lsn = min_restart_lsn == InvalidXLogRecPtr ? s->data.restart_lsn
                                                                    : Min(min_restart_lsn, s->data.restart_lsn);
        }
    }
    if (min_restart_lsn == InvalidXLogRecPtr) {
        return false;
    }
    XLogRecPtr flush_lsn = GetFlushRecPtr();
    if (((flush_lsn - min_restart_lsn) >> xlog_offset) > (uint64)max_keep_log_seg) {
        g_logical_slot_sleep_time += sleep_time_unit;
        if (g_logical_slot_sleep_time > MICROSECONDS_PER_SECONDS) {
            g_logical_slot_sleep_time = MICROSECONDS_PER_SECONDS;
        }
        ereport(LOG,
                (errmsg("flush_lsn %X/%X exceed min_restart_lsn %X/%X by threshold %ld, sleep time increase by 0.1s.\n",
                        (uint32)(flush_lsn >> 32), (uint32)flush_lsn, (uint32)(min_restart_lsn >> 32),
                        (uint32)min_restart_lsn, max_keep_log_seg)));
        return true;
    } else {
        g_logical_slot_sleep_time = 0;
    }
    return false;
}

/*
 * Throttle this walsender after a standby reply.
 *
 * If a recovery target applies to this sender type, the target-driven sleep
 * logic runs; otherwise only the logical-slot back-pressure sleep is applied
 * (and never in shared-storage / dorado modes). sleep_count is incremented
 * on every call.
 */
static void LogCtrlDoActualSleep(volatile WalSnd *walsnd, bool forceUpdate)
{
    bool logical_slot_sleep_flag = LogicalSlotSleepFlag();

    /* try to control log sent rate so that standby can flush and apply log under RTO seconds */
    if (walsnd->state > WALSNDSTATE_BACKUP &&
        (IS_PGXC_DATANODE || AM_WAL_HADR_CN_SENDER || AM_WAL_SHARE_STORE_SENDER)) {
        bool targetConfigured;

        if (AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER) {
            targetConfigured = (u_sess->attr.attr_storage.hadr_recovery_time_target > 0 ||
                                u_sess->attr.attr_storage.hadr_recovery_point_target > 0);
        } else {
            targetConfigured = (u_sess->attr.attr_storage.target_rto > 0);
        }

        if (targetConfigured) {
            LogCtrlExecuteSleeping(walsnd, forceUpdate, logical_slot_sleep_flag);
        } else if (logical_slot_sleep_flag && !IS_SHARED_STORAGE_MODE && !SS_REPLICATION_DORADO_CLUSTER) {
            pg_usleep(g_logical_slot_sleep_time);
        }
    }
    walsnd->log_ctrl.sleep_count++;
}

/*
 * Recalculate the sleep times when due, then sleep.
 *
 * The recalculation runs every sleep_count_limit calls or when forceUpdate
 * is set. After the regular LogCtrlSleep(), an extra sleep covers whatever
 * part of the logical-slot sleep time exceeds the walsender's own sleep time
 * (skipped in shared-storage / dorado modes).
 */
static void LogCtrlExecuteSleeping(volatile WalSnd *walsnd, bool forceUpdate, bool logicalSlotSleepFlag)
{
    bool recalcDue = (walsnd->log_ctrl.sleep_count % walsnd->log_ctrl.sleep_count_limit == 0) || forceUpdate;

    if (recalcDue) {
        /* calculate RPO sleep time */
        if (AM_WAL_HADR_DNCN_SENDER && (u_sess->attr.attr_storage.hadr_recovery_point_target > 0)) {
            LogCtrlCalculateSleepTime(g_instance.streaming_dr_cxt.rpoSleepTime,
                g_instance.streaming_dr_cxt.rpoBalanceSleepTime, true);
        }

        /* calculate RTO sleep time; the governing GUC depends on the sender type */
        bool rtoTargetSet;
        if (AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER) {
            rtoTargetSet = (u_sess->attr.attr_storage.hadr_recovery_time_target > 0);
        } else {
            rtoTargetSet = (u_sess->attr.attr_storage.target_rto > 0);
        }
        if (rtoTargetSet) {
            LogCtrlCalculateSleepTime(walsnd->log_ctrl.sleep_time, walsnd->log_ctrl.balance_sleep_time, false);
        }

        LogCtrlCountSleepLimit();
    }

    LogCtrlSleep();

    if (!logicalSlotSleepFlag) {
        return;
    }
    if (g_logical_slot_sleep_time > t_thrd.walsender_cxt.MyWalSnd->log_ctrl.sleep_time &&
        !IS_SHARED_STORAGE_MODE && !SS_REPLICATION_DORADO_CLUSTER) {
        pg_usleep(g_logical_slot_sleep_time - t_thrd.walsender_cxt.MyWalSnd->log_ctrl.sleep_time);
    }
}

/*
 * Set *forceUpdate to true when more than MILLISECONDS_PER_SECONDS
 * milliseconds separate the previous reply time from reply->sendTime, and to
 * false when they do not. *forceUpdate is left untouched while no previous
 * reply time has been recorded.
 */
static void LogCtrlNeedForceUpdate(bool *forceUpdate, const StandbyReplyMessage *reply)
{
    /* use volatile pointer to prevent code rearrangement */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    if (!(walsnd->log_ctrl.prev_reply_time > 0)) {
        return;
    }

    long secs;
    int usecs;
    TimestampDifference(walsnd->log_ctrl.prev_reply_time, reply->sendTime, &secs, &usecs);

    long elapsedMs = secs * MILLISECONDS_PER_SECONDS + usecs / MILLISECONDS_PER_MICROSECONDS;
    *forceUpdate = elapsedMs > MILLISECONDS_PER_SECONDS;
}

/*
 * Report whether the current RTO (or, for HADR / share-store senders, the
 * current RTO or RPO) exceeds its configured non-zero target.
 */
static bool IsRtoRpoOverTarget()
{
    /* use volatile pointer to prevent code rearrangement */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    if (AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER) {
        if (u_sess->attr.attr_storage.hadr_recovery_time_target != 0 &&
            walsnd->log_ctrl.current_RTO > u_sess->attr.attr_storage.hadr_recovery_time_target) {
            return true;
        }
        if (u_sess->attr.attr_storage.hadr_recovery_point_target != 0 &&
            walsnd->log_ctrl.current_RPO > u_sess->attr.attr_storage.hadr_recovery_point_target) {
            return true;
        }
        return false;
    }

    if (u_sess->attr.attr_storage.target_rto != 0 &&
        walsnd->log_ctrl.current_RTO > u_sess->attr.attr_storage.target_rto) {
        return true;
    }
    return false;
}

/*
 * Publish this walsender's standby name, current sleep time and RTO target
 * into g_instance.rto_cxt.rto_standby_data[walsnd->index].
 *
 * When the governing target GUC is 0 the corresponding sleep time is reset
 * to 0. A LOG line is written whenever the published target differs from the
 * current GUC value, after which the published target is updated.
 */
static void ProcessTargetRtoRpoChanged()
{
    /* use volatile pointer to prevent code rearrangement */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    char *standbyId = (char *)(g_instance.rto_cxt.rto_standby_data[walsnd->index].id);
    int ret = strncpy_s(standbyId, NODENAMELEN, u_sess->attr.attr_common.application_name,
                        strlen(u_sess->attr.attr_common.application_name));
    securec_check(ret, "\0", "\0");

    if (AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER) {
        if (u_sess->attr.attr_storage.hadr_recovery_time_target != 0) {
            g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time = walsnd->log_ctrl.sleep_time;
        } else {
            /* RTO control disabled: clear both the published and the local sleep time */
            g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time = 0;
            walsnd->log_ctrl.sleep_time = 0;
        }

        /* RPO control disabled: clear the instance-wide RPO sleep time */
        if (u_sess->attr.attr_storage.hadr_recovery_point_target == 0) {
            g_instance.streaming_dr_cxt.rpoSleepTime = 0;
        }

        if (g_instance.rto_cxt.rto_standby_data[walsnd->index].target_rto !=
            u_sess->attr.attr_storage.hadr_recovery_time_target) {
            ereport(LOG, (errmodule(MOD_RTO_RPO),
                          errmsg("hadr_target_rto changes to %d, previous target_rto is %d, "
                                 "current the sleep time is %ld",
                                 u_sess->attr.attr_storage.hadr_recovery_time_target,
                                 g_instance.rto_cxt.rto_standby_data[walsnd->index].target_rto,
                                 g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time)));

            g_instance.rto_cxt.rto_standby_data[walsnd->index].target_rto =
                u_sess->attr.attr_storage.hadr_recovery_time_target;
        }
        return;
    }

    if (u_sess->attr.attr_storage.target_rto != 0) {
        g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time = walsnd->log_ctrl.sleep_time;
    } else {
        /* RTO control disabled: clear both the published and the local sleep time */
        g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time = 0;
        walsnd->log_ctrl.sleep_time = 0;
    }

    if (g_instance.rto_cxt.rto_standby_data[walsnd->index].target_rto != u_sess->attr.attr_storage.target_rto) {
        ereport(LOG, (errmodule(MOD_RTO_RPO),
                      errmsg("target_rto changes to %d, previous target_rto is %d, current the sleep time is %ld",
                             u_sess->attr.attr_storage.target_rto,
                             g_instance.rto_cxt.rto_standby_data[walsnd->index].target_rto,
                             g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time)));

        g_instance.rto_cxt.rto_standby_data[walsnd->index].target_rto = u_sess->attr.attr_storage.target_rto;
    }
}

/*
 * Advance replication-slot state to the position `flush` confirmed by the peer.
 *
 * - If this walsender is attached to a logical dispatcher slot, its read
 *   worker's flushLSN is updated.
 * - If we own a replication slot and `flush` is valid, the slot's confirmed
 *   position is advanced (logical or physical, depending on whether the slot
 *   is bound to a database).
 * - For a logical slot while recovery is in progress, the primary is
 *   notified of the advance, at most once per logical_slot_advanced_timeout.
 */
static void AdvanceReplicationSlot(XLogRecPtr flush)
{
    if (t_thrd.walsender_cxt.LogicalSlot != -1) {
        int slotId = t_thrd.walsender_cxt.LogicalSlot;
        SpinLockAcquire(&(g_Logicaldispatcher[slotId].readWorker->rwlock));
        g_Logicaldispatcher[slotId].readWorker->flushLSN = flush;
        SpinLockRelease(&(g_Logicaldispatcher[slotId].readWorker->rwlock));
    }

    /* nothing more to do without a slot or without a valid position */
    if (!t_thrd.slot_cxt.MyReplicationSlot || XLByteEQ(flush, InvalidXLogRecPtr)) {
        return;
    }

    /* a slot not bound to a database is a physical slot */
    if (t_thrd.slot_cxt.MyReplicationSlot->data.database == InvalidOid) {
        PhysicalConfirmReceivedLocation(flush);
        return;
    }

    LogicalConfirmReceivedLocation(flush);
    if (!(RecoveryInProgress() && OidIsValid(t_thrd.slot_cxt.MyReplicationSlot->data.database))) {
        return;
    }

    /*
     * Check if time since last notify primary logical slot advancing has reached the limit.
     * If reached, notify primary advance logical slot.
     */
    if (t_thrd.walsender_cxt.last_logical_slot_advanced_timestamp <= 0) {
        return;
    }
    TimestampTz now = GetCurrentTimestamp();
    TimestampTz nextNotifyTime = TimestampTzPlusMilliseconds(t_thrd.walsender_cxt.last_logical_slot_advanced_timestamp,
                                                             t_thrd.walsender_cxt.logical_slot_advanced_timeout);
    if (now < nextNotifyTime) {
        return;
    }
    t_thrd.walsender_cxt.last_logical_slot_advanced_timestamp = now;

    /* Notify the primary to advance logical slot location */
    NotifyPrimaryAdvance(t_thrd.slot_cxt.MyReplicationSlot->data.restart_lsn, flush);
    NotifyPrimaryCatalogXmin(t_thrd.slot_cxt.MyReplicationSlot->data.catalog_xmin);
}

/*
 * Run log flow control for one standby reply: refresh the RTO/RPO estimates
 * when NEED_CALCULATE_RTO holds, remember the reply as the new "previous"
 * sample if the calculation asked for it, then perform the actual sleep.
 */
static void ProcessLogCtrl(StandbyReplyMessage reply)
{
    /* use volatile pointer to prevent code rearrangement */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    bool forceUpdate = false;

    LogCtrlNeedForceUpdate(&forceUpdate, &reply);

    if (NEED_CALCULATE_RTO) {
        /* cleared by the RTO calculation when this reply must not become the new baseline */
        bool refreshBaseline = true;

        LogCtrlCalculateCurrentRTO(&reply, &refreshBaseline);
#ifndef ENABLE_MULTIPLE_NODES
        if ((AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER) && refreshBaseline) {
            LogCtrlCalculateCurrentRPO(&reply);
        }
#else
        if (AM_WAL_SHARE_STORE_SENDER && refreshBaseline) {
            LogCtrlCalculateCurrentRPO(&reply);
        } else if (AM_WAL_HADR_DNCN_SENDER && refreshBaseline) {
            LogCtrlCalculateHadrCurrentRPO();
        }
#endif
        if (refreshBaseline) {
            walsnd->log_ctrl.prev_reply_time = reply.sendTime;
            walsnd->log_ctrl.prev_flush = reply.flush;
            walsnd->log_ctrl.prev_apply = reply.apply;
        }
    }

    LogCtrlDoActualSleep(walsnd, forceUpdate);
}

/*
 * Regular reply from standby advising of WAL positions on standby server.
 */
static void ProcessStandbyReplyMessage(void)
{
    StandbyReplyMessage reply;
    XLogRecPtr sndFlush = InvalidXLogRecPtr;
    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char *)&reply, sizeof(StandbyReplyMessage));

    ereport(DEBUG2, (errmsg("receive %X/%X write %X/%X flush %X/%X apply %X/%X", (uint32)(reply.receive >> 32),
                            (uint32)reply.receive, (uint32)(reply.write >> 32), (uint32)reply.write,
                            (uint32)(reply.flush >> 32), (uint32)reply.flush, (uint32)(reply.apply >> 32),
                            (uint32)reply.apply)));

    /* send a reply if the standby requested one */
    if (reply.replyRequested) {
        WalSndKeepalive(false);
    }

    if ((reply.replyFlags & IS_CANCEL_LOG_CTRL) != 0) {
        t_thrd.walsender_cxt.cancelLogCtl = true;
    } else {
        t_thrd.walsender_cxt.cancelLogCtl = false;
    }
    /* use volatile pointer to prevent code rearrangement */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    TimestampTz now = GetCurrentTimestamp();
    XLogRecPtr localFlush = GetFlushRecPtr();

    /*
     * Update shared state for this WalSender process based on reply data from
     * standby.
     */
    {
        SpinLockAcquire(&walsnd->mutex);
        /*
         * If reply position is bigger than last one, or equal to local flush,
         * update change time.
         */
        walsnd->lastReceiveChangeTime = XLByteLT(walsnd->receive, reply.receive) ||
            XLByteEQ(walsnd->receive, localFlush) ? now : walsnd->lastReceiveChangeTime;
        walsnd->lastWriteChangeTime = XLByteLT(walsnd->write, reply.write) ||
            XLByteEQ(walsnd->write, localFlush) ? now : walsnd->lastWriteChangeTime;
        walsnd->lastFlushChangeTime = XLByteLT(walsnd->flush, reply.flush) ||
            XLByteEQ(walsnd->flush, localFlush) ? now : walsnd->lastFlushChangeTime;
        walsnd->lastApplyChangeTime = XLByteLT(walsnd->apply, reply.apply) ||
            XLByteEQ(walsnd->apply, localFlush) ? now : walsnd->lastApplyChangeTime;
        walsnd->receive = reply.receive;
        walsnd->write = reply.write;
        walsnd->flush = reply.flush;
        walsnd->apply = reply.apply;
        walsnd->peer_role = reply.peer_role;
        walsnd->peer_state = reply.peer_state;
        walsnd->replyFlags = reply.replyFlags;
        SpinLockRelease(&walsnd->mutex);
    }

    /*
     * Only sleep when local role is not WAL_DB_SENDER.
     */
    if (!t_thrd.walsender_cxt.cancelLogCtl && !AM_WAL_DB_SENDER &&
        walsnd->sendRole != SNDROLE_PRIMARY_BUILDSTANDBY) {
        ProcessLogCtrl(reply);
    }

    if (IS_PGXC_DATANODE || AM_WAL_HADR_CN_SENDER) {
        ProcessTargetRtoRpoChanged();
    }

    if (!AM_WAL_STANDBY_SENDER) {
        SyncRepReleaseWaiters();
    }

    /*
     * Advance our local xmin horizon when the client confirmed a flush.
     * 1. When starting ss dorado replication, we need to know replayPtr that standby has already replayed,
     * because primary xlog will cover standby xlog by Dorado synchronous replication.
     * 2. Otherwise, we only need to confirm that standby xlog has been flushed successfully.
     */
    if (SS_REPLICATION_DORADO_CLUSTER) {
        AdvanceReplicationSlot(reply.apply);
    } else {
        AdvanceReplicationSlot(reply.flush);
    }

    if (AM_WAL_STANDBY_SENDER) {
        sndFlush = GetFlushRecPtr();
        WalSndRefreshPercentCountStartLsn(sndFlush, reply.flush);
    }
}

/*
 * Compute a new replication slot xmin horizon if needed.
 *
 * Clears this thread's own xmin and exrto_* fields, then stores feedbackXmin
 * in the slot when either xmin is not a normal transaction id or the slot's
 * xmin precedes the feedback value. last_xmin_change_time is refreshed on
 * every call.
 */
static void PhysicalReplicationSlotNewXmin(TransactionId feedbackXmin)
{
    volatile ReplicationSlot *slot = t_thrd.slot_cxt.MyReplicationSlot;
    bool updated = false;

    SpinLockAcquire(&slot->mutex);
    t_thrd.pgxact->xmin = InvalidTransactionId;
    t_thrd.proc->exrto_read_lsn = 0;
    t_thrd.proc->exrto_min = 0;
    t_thrd.proc->exrto_gen_snap_time = 0;
    /*
     * For physical replication we don't need the interlock provided
     * by xmin and effective_xmin since the consequences of a missed increase
     * are limited to query cancellations, so set both at once.
     */
    updated = !TransactionIdIsNormal(slot->data.xmin) || !TransactionIdIsNormal(feedbackXmin) ||
        TransactionIdPrecedes(slot->data.xmin, feedbackXmin);
    if (updated) {
        slot->data.xmin = feedbackXmin;
        slot->effective_xmin = feedbackXmin;
    }
    slot->last_xmin_change_time = GetCurrentTimestamp();
    SpinLockRelease(&slot->mutex);

    if (!updated) {
        return;
    }
    ReplicationSlotMarkDirty();
    ReplicationSlotsComputeRequiredXmin(false);
}

/*
 * Hot Standby feedback: apply the xmin reported by the standby either to our
 * replication slot or, when we have no slot, to this walsender's PGXACT entry.
 */
static void ProcessStandbyHSFeedbackMessage(void)
{
    StandbyHSFeedbackMessage reply;

    /* Decipher the reply message */
    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char *)&reply, sizeof(StandbyHSFeedbackMessage));

    ereport(DEBUG2, (errmsg("hot standby feedback xmin " XID_FMT, reply.xmin)));

    /*
     * A non-normal xmin is not applied to PGXACT; if we own a slot it is
     * still handed to the slot logic.
     */
    if (!TransactionIdIsNormal(reply.xmin)) {
        if (t_thrd.slot_cxt.MyReplicationSlot != NULL) {
            PhysicalReplicationSlotNewXmin(reply.xmin);
        }
        return;
    }

    TransactionId nextXid = ReadNewTransactionId();
    if (!TransactionIdPrecedesOrEquals(reply.xmin, nextXid)) {
        /* epoch OK, but it's wrapped around */
        return;
    }

    /*
     * Set the WalSender's xmin equal to the standby's requested xmin, so that
     * the xmin will be taken into account by GetOldestXmin.  This will hold
     * back the removal of dead rows and thereby prevent the generation of
     * cleanup conflicts on the standby server.
     *
     * There is a small window for a race condition here: although we just
     * checked that reply.xmin precedes nextXid, the nextXid could have gotten
     * advanced between our fetching it and applying the xmin below, perhaps
     * far enough to make reply.xmin wrap around.  In that case the xmin we
     * set here would be "in the future" and have no effect.  No point in
     * worrying about this since it's too late to save the desired data
     * anyway.  Assuming that the standby sends us an increasing sequence of
     * xmins, this could only happen during the first reply cycle, else our
     * own xmin would prevent nextXid from advancing so far.
     *
     * We don't bother taking the ProcArrayLock here.  Setting the xmin field
     * is assumed atomic, and there's no real need to prevent a concurrent
     * GetOldestXmin.  (If we're moving our xmin forward, this is obviously
     * safe, and if we're moving it backwards, well, the data is at risk
     * already since a VACUUM could have just finished calling GetOldestXmin.)
     *
     * If we're using a replication slot we reserve the xmin via that,
     * otherwise via the walsender's PGXACT entry.
     *
     * XXX: It might make sense to introduce ephemeral slots and always use
     * the slot mechanism.
     * XXX: persistency configurable?
     */
    if (t_thrd.slot_cxt.MyReplicationSlot == NULL) {
        t_thrd.pgxact->xmin = reply.xmin;
        return;
    }
    PhysicalReplicationSlotNewXmin(reply.xmin);
}

/*
 * process message from standby request primary server making switchover.
 */
static void ProcessStandbySwitchRequestMessage(void)
{
    int i;
    StandbySwitchRequestMessage message;

    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char *)&message, sizeof(StandbySwitchRequestMessage));

    if (message.demoteMode < SmartDemote || message.demoteMode > ExtremelyFast) {
        ereport(WARNING,
                (errmsg("invalid switchover mode in standby switchover request message: %d", message.demoteMode)));
        return;
    } else if (message.demoteMode == ExtremelyFast){
        g_instance.wal_cxt.upgradeSwitchMode = ExtremelyFast;
    }

    SpinLockAcquire(&t_thrd.walsender_cxt.WalSndCtl->mutex);

    /*
     * If the catchup thread is alive, we must stop the demoting process
     * at once. There will be some risk of losting data when catchup can't send the data pages.
     */
    if (catchup_online) {
        volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
        ClusterNodeState old_mode = walsnd->node_state;

        walsnd->node_state = NODESTATE_PRIMARY_DEMOTING_WAIT_CATCHUP;
        WalSndResponseSwitchover(t_thrd.walsender_cxt.output_xlog_message);
        walsnd->node_state = old_mode;

        SpinLockRelease(&t_thrd.walsender_cxt.WalSndCtl->mutex);
        ereport(NOTICE, (errmsg("could not continuing switchover process when catchup is alive.")));
        return;
    }
    if (t_thrd.walsender_cxt.WalSndCtl->demotion > NoDemote &&
        t_thrd.walsender_cxt.Demotion != t_thrd.walsender_cxt.WalSndCtl->demotion) {
        SpinLockRelease(&t_thrd.walsender_cxt.WalSndCtl->mutex);
        ereport(NOTICE, (errmsg("master is doing switchover,\
                                probably another standby already requested switchover.")));
        return;
    } else if (message.demoteMode <= t_thrd.walsender_cxt.Demotion) {
        SpinLockRelease(&t_thrd.walsender_cxt.WalSndCtl->mutex);
        ereport(NOTICE, (errmsg("the standby already requested %s switchover, so ignore new %s switchover request.",
                                DemoteModeDesc(t_thrd.walsender_cxt.Demotion), DemoteModeDesc(message.demoteMode))));
        return;
    }

    t_thrd.walsender_cxt.WalSndCtl->demotion = (DemoteMode)message.demoteMode;

    /* update the demote state */
    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        if (walsnd->pid == 0) {
            continue;
        }

        walsnd->node_state = NODESTATE_PRIMARY_DEMOTING;
    }
    t_thrd.walsender_cxt.MyWalSnd->node_state = (ClusterNodeState)message.demoteMode;

    SpinLockRelease(&t_thrd.walsender_cxt.WalSndCtl->mutex);

    t_thrd.walsender_cxt.Demotion = (DemoteMode)message.demoteMode;
    ereport(LOG,
            (errmsg("received %s switchover request from standby", DemoteModeDesc(t_thrd.walsender_cxt.Demotion))));

    SendPostmasterSignal(PMSIGNAL_DEMOTE_PRIMARY);
}

/*
 * Archive feedback from the standby.
 *
 * Stores the reported archive result and target LSN in the archive task
 * status that belongs to the slot named in the message, then wakes the
 * archiver through its latch. Raises an ERROR when no task status exists for
 * the slot name; only warns when the archiver latch is not set up yet.
 */
static void ProcessArchiveFeedbackMessage(void)
{
    ArchiveXlogResponseMessage reply;
    /* Decipher the reply message */
    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char*)&reply, sizeof(ArchiveXlogResponseMessage));
    /*
     * The slot name was copied byte-wise off the wire and is used as a C
     * string below, so force termination.
     * (assumes slot_name is an inline char array of the message struct — TODO confirm)
     */
    reply.slot_name[sizeof(reply.slot_name) - 1] = '\0';
    ereport(LOG,
        (errmsg("ProcessArchiveFeedbackMessage %s : %d %X/%X",
            reply.slot_name, reply.pitr_result, (uint32)(reply.targetLsn >> 32), (uint32)(reply.targetLsn))));

    ArchiveTaskStatus *archive_task_status = find_archive_task_status(reply.slot_name);
    if (archive_task_status == NULL) {
        ereport(ERROR,
            (errmsg("ProcessArchiveFeedbackMessage %s : %d %X/%X, but not find slot",
                reply.slot_name, reply.pitr_result, (uint32)(reply.targetLsn >> 32), (uint32)(reply.targetLsn))));
    }
    SpinLockAcquire(&archive_task_status->mutex);
    archive_task_status->pitr_finish_result = reply.pitr_result;
    archive_task_status->archive_task.targetLsn = reply.targetLsn;
    SpinLockRelease(&archive_task_status->mutex);
    if (archive_task_status->archiver_latch == NULL) {
        /*
         * The standby sent feedback for an archive request issued before the
         * last restart and the archiver thread has not started yet, so there
         * is nobody to wake; ignore the message until the archiver is running.
         */
        ereport(WARNING,
            (errmsg("master received archive feedback message, but arch not work yet  %d %X/%X", reply.pitr_result,
                (uint32)(reply.targetLsn >> 32), (uint32)(reply.targetLsn))));
        return;
    }
    SetLatch(archive_task_status->archiver_latch);
}

/*
 * Count the limit for sleep_count, it is based on sleep time.
 */
static void LogCtrlCountSleepLimit(void)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    int64 countLimit1;
    int64 countLimit2;

    if (walsnd->log_ctrl.sleep_time == 0) {
        countLimit1 = MAX_CONTROL_REPLY;
    } else {
        countLimit1 = INIT_CONTROL_REPLY * MICROSECONDS_PER_SECONDS / walsnd->log_ctrl.sleep_time;
        countLimit1 = (countLimit1 > MAX_CONTROL_REPLY) ? MAX_CONTROL_REPLY : countLimit1;
        countLimit1 = (countLimit1 <= 0) ? INIT_CONTROL_REPLY : countLimit1;
    }
    if (g_instance.streaming_dr_cxt.rpoSleepTime == 0) {
        countLimit2 = MAX_CONTROL_REPLY;
    } else {
        countLimit2 = INIT_CONTROL_REPLY * MICROSECONDS_PER_SECONDS / g_instance.streaming_dr_cxt.rpoSleepTime;
        countLimit2 = (countLimit2 > MAX_CONTROL_REPLY) ? MAX_CONTROL_REPLY : countLimit2;
        countLimit2 = (countLimit2 <= 0) ? INIT_CONTROL_REPLY : countLimit2;
    }
    walsnd->log_ctrl.sleep_count_limit = (countLimit1 <= countLimit2) ? countLimit1 : countLimit2;
}

/*
 * Sleep for the walsender's current sleep time, capped at
 * MICROSECONDS_PER_SECONDS, and publish the (capped) value as
 * current_sleep_time for this standby.
 *
 * In shared-storage / dorado modes the value is only capped and published;
 * no sleep is performed.
 */
static void LogCtrlSleep(void)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    if (IS_SHARED_STORAGE_MODE || SS_REPLICATION_DORADO_CLUSTER) {
        if (walsnd->log_ctrl.sleep_time > MICROSECONDS_PER_SECONDS) {
            walsnd->log_ctrl.sleep_time = MICROSECONDS_PER_SECONDS;
        }
        g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time = walsnd->log_ctrl.sleep_time;
        return;
    }

    if (walsnd->log_ctrl.sleep_time > 0) {
        ereport(DEBUG4, (errmodule(MOD_RTO_RPO), errmsg("LogCtrlSleep:%lu", walsnd->log_ctrl.sleep_time)));

        bool overCap = walsnd->log_ctrl.sleep_time > MICROSECONDS_PER_SECONDS;

        pgstat_report_waitevent(WAIT_EVENT_LOGCTRL_SLEEP);
        if (overCap) {
            pg_usleep_retry(MICROSECONDS_PER_SECONDS, 0);
        } else {
            pg_usleep_retry(walsnd->log_ctrl.sleep_time, 0);
        }
        pgstat_report_waitevent(WAIT_EVENT_END);

        /* remember the cap so later calculations start from the value actually slept */
        if (overCap) {
            walsnd->log_ctrl.sleep_time = MICROSECONDS_PER_SECONDS;
        }
    }

    g_instance.rto_cxt.rto_standby_data[walsnd->index].current_sleep_time = walsnd->log_ctrl.sleep_time;
}

/*
 * Blend a stored speed with a fresh sample.
 *
 * Returns (((originSpeed << SHIFT_SPEED) - originSpeed) >> SHIFT_SPEED) + curSpeed,
 * evaluated in unsigned 64-bit integer arithmetic.
 */
static inline uint64 LogCtrlCountBigSpeed(uint64 originSpeed, uint64 curSpeed)
{
    uint64 scaledOrigin = originSpeed << SHIFT_SPEED;
    uint64 decayedOrigin = (scaledOrigin - originSpeed) >> SHIFT_SPEED;
    return decayedOrigin + curSpeed;
}

/*
 * Decide whether a standby reply can be used for a new RTO calculation.
 *
 * Returns false when the reported positions are inconsistent or moved
 * backwards, when the standby has applied everything it received (current_RTO
 * is then set to 0), when no previous reply or calculation time exists, or,
 * for HADR DN/CN senders outside a barrier pause, when apply did not move
 * (in which case *needRefresh is also cleared). Whenever the reply is
 * rejected while *needRefresh is still set, the calculation period is
 * restarted at reply->sendTime. The current RTO is always published to
 * rto_standby_data before returning.
 */
static bool ReplyMessageCheck(StandbyReplyMessage *reply, bool *needRefresh)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    /* positions must satisfy receive >= flush >= apply and must not go backwards */
    bool usable = !(XLByteLT(reply->receive, reply->flush) || XLByteLT(reply->flush, reply->apply) ||
        XLByteLT(reply->flush, walsnd->log_ctrl.prev_flush) || XLByteLT(reply->apply, walsnd->log_ctrl.prev_apply));

    /* everything received has been applied: the RTO is zero by definition */
    if (XLByteEQ(reply->receive, reply->apply)) {
        walsnd->log_ctrl.prev_RTO = walsnd->log_ctrl.current_RTO;
        walsnd->log_ctrl.current_RTO = 0;
        usable = false;
    }

    if (AM_WAL_HADR_DNCN_SENDER) {
        if (!STANDBY_IN_BARRIER_PAUSE && reply->apply == walsnd->log_ctrl.prev_apply) {
            *needRefresh = false;
            usable = false;
        }
        ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
            errmsg("reply->replyFlags is %d, reply->reveive is %lu, reply->flush is %lu, reply->apply is %lu",
                   reply->replyFlags, reply->receive, reply->flush, reply->apply)));
    }

    /* without a previous reply there is no interval to measure */
    if (walsnd->log_ctrl.prev_reply_time == 0) {
        usable = false;
    }

    /* (re)start the calculation period */
    if (walsnd->log_ctrl.prev_calculate_time == 0 || (!usable && *needRefresh)) {
        walsnd->log_ctrl.prev_calculate_time = reply->sendTime;
        walsnd->log_ctrl.period_total_flush = 0;
        walsnd->log_ctrl.period_total_apply = 0;
        usable = false;
    }

    g_instance.rto_cxt.rto_standby_data[walsnd->index].current_rto = walsnd->log_ctrl.current_RTO;
    return usable;
}

/*
 * Estimate the time standby need to flush and apply log.
 *
 * reply:       latest reply from the standby (receive/flush/apply positions
 *              and send time).
 * needRefresh: in/out flag; cleared here when the reply arrived 100 ms or
 *              less after the previous one, so the caller keeps the previous
 *              sample as baseline. ReplyMessageCheck() may clear it as well.
 *
 * On success the flush/apply rates, the per-period byte accumulators,
 * prev_RTO/current_RTO and the published current_rto in rto_standby_data are
 * updated. The function returns early, without a new estimate, when the
 * reply is rejected by ReplyMessageCheck(), when the sample interval is too
 * short, or when the calculation period has non-positive length.
 */
static void LogCtrlCalculateCurrentRTO(StandbyReplyMessage *reply, bool *needRefresh)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    long sec_to_time;
    int microsec_to_time;

    if (!ReplyMessageCheck(reply, needRefresh)) {
        return;
    }

    /* milliseconds elapsed between the previous reply and this one */
    TimestampDifference(walsnd->log_ctrl.prev_reply_time, reply->sendTime, &sec_to_time, &microsec_to_time);
    long millisec_time_diff = sec_to_time * MILLISECONDS_PER_SECONDS +
        microsec_to_time / MILLISECONDS_PER_MICROSECONDS;
    /* sample interval too short: skip and keep the previous baseline */
    if (millisec_time_diff <= 100) {
        *needRefresh = false;
        return;
    }

    /* backlog still to be flushed / applied, and progress made since the previous reply */
    uint64 needFlush = reply->receive - reply->flush;
    uint64 needApply = reply->flush - reply->apply;
    uint64 newFlush = reply->flush - walsnd->log_ctrl.prev_flush;
    uint64 newApply = reply->apply - walsnd->log_ctrl.prev_apply;
    /* progress accumulated over the current calculation period */
    uint64 periodTotalFlush = walsnd->log_ctrl.period_total_flush + newFlush;
    uint64 periodTotalApply = walsnd->log_ctrl.period_total_apply + newApply;

    /* To reduce the speed fluctuation caused by frequent calculation, we calculate the speed every 2s(time_range). */
    TimestampDifference(walsnd->log_ctrl.prev_calculate_time, reply->sendTime, &sec_to_time, &microsec_to_time);
    long calculate_time_diff = sec_to_time * MILLISECONDS_PER_SECONDS +
        microsec_to_time / MILLISECONDS_PER_MICROSECONDS;
    /* also protects the divisions by calculate_time_diff below */
    if (calculate_time_diff <= 0) {
        return;
    }

    /*
     * consumeRatePart1 and consumeRatePart2 is based on 7/8 previous_speed(walsnd->log_ctrl.flush_rate or apply_rate)
     * and 1/8 speed_now(newFlush or newApply / millisec_time_diff). To be more precise and keep more decimal point,
     * we expand speed_now by multiply first then divide, which is (8 * previous_speed * 7/8 + speed_now) / 8.
     */
    /*
     * The stored rates are kept left-shifted by SHIFT_SPEED. While a rate is
     * still small (<= 1 after shifting back) it is simply reseeded from the
     * latest sample; otherwise it is blended with the period average, but
     * only once the period exceeds CALCULATE_INTERVAL_MILLISECOND or a target
     * is currently exceeded.
     */
    if ((walsnd->log_ctrl.flush_rate >> SHIFT_SPEED) > 1) {
        if (calculate_time_diff > CALCULATE_INTERVAL_MILLISECOND || IsRtoRpoOverTarget()) {
            walsnd->log_ctrl.flush_rate = LogCtrlCountBigSpeed(walsnd->log_ctrl.flush_rate,
                                                              (uint64)(periodTotalFlush / calculate_time_diff));
            walsnd->log_ctrl.prev_calculate_time = reply->sendTime;
        }
    } else {
        walsnd->log_ctrl.flush_rate = ((newFlush / (uint64)millisec_time_diff) << SHIFT_SPEED);
    }
    if ((walsnd->log_ctrl.apply_rate >> SHIFT_SPEED) > 1) {
        if (calculate_time_diff > CALCULATE_INTERVAL_MILLISECOND || IsRtoRpoOverTarget()) {
            /* the apply rate is left unchanged when nothing was applied since the previous reply */
            if (newApply != 0) {
                walsnd->log_ctrl.apply_rate = LogCtrlCountBigSpeed(walsnd->log_ctrl.apply_rate,
                                                                  (uint64)(periodTotalApply / calculate_time_diff));
            }
            walsnd->log_ctrl.prev_calculate_time = reply->sendTime;
        }
    } else {
        walsnd->log_ctrl.apply_rate = ((uint64)(newApply / millisec_time_diff) << SHIFT_SPEED);
    }

    /* a period was just closed above iff prev_calculate_time now equals this reply's send time */
    if (walsnd->log_ctrl.prev_calculate_time == reply->sendTime) {
        walsnd->log_ctrl.period_total_flush = 0;
        walsnd->log_ctrl.period_total_apply = 0;
    } else {
        walsnd->log_ctrl.period_total_flush = periodTotalFlush;
        walsnd->log_ctrl.period_total_apply = periodTotalApply;
    }
    /* for an HADR DN/CN sender whose standby is in barrier pause, report an RTO of 0 */
    if (AM_WAL_HADR_DNCN_SENDER && STANDBY_IN_BARRIER_PAUSE) {
        walsnd->log_ctrl.prev_RTO = walsnd->log_ctrl.current_RTO;
        walsnd->log_ctrl.current_RTO = 0;
        g_instance.rto_cxt.rto_standby_data[walsnd->index].current_rto = walsnd->log_ctrl.current_RTO;
        return;
    }

    /* unscaled rates; clamp to at least 1 to avoid dividing by zero */
    uint64 flushSpeed = (walsnd->log_ctrl.flush_rate >> SHIFT_SPEED);
    uint64 applySpeed = (walsnd->log_ctrl.apply_rate >> SHIFT_SPEED);
    if (flushSpeed == 0) {
        flushSpeed = 1;
    }

    if (applySpeed == 0) {
        applySpeed = 1;
    }

    /*
     * part1: time to flush the unflushed backlog; part2: time to apply
     * everything not yet applied. The estimate is the larger of the two.
     */
    uint64 sec_RTO_part1 = (needFlush / flushSpeed) / MILLISECONDS_PER_SECONDS;
    uint64 sec_RTO_part2 = ((needFlush + needApply) / applySpeed) / MILLISECONDS_PER_SECONDS;
    uint64 sec_RTO = sec_RTO_part1 > sec_RTO_part2 ? sec_RTO_part1 : sec_RTO_part2;
    walsnd->log_ctrl.prev_RTO = walsnd->log_ctrl.current_RTO;
    walsnd->log_ctrl.current_RTO = sec_RTO;

    g_instance.rto_cxt.rto_standby_data[walsnd->index].current_rto = walsnd->log_ctrl.current_RTO;
    ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
                     errmsg("The RTO estimated is = : %lu seconds. reply->reveive is %lu, reply->flush is %lu, "
                            "reply->apply is %lu, pre_flush is %lu, pre_apply is %lu, TimestampDifference is %ld, "
                            "flushSpeed is %lu, applySpeed is %lu, flush_sec is %ld ms, apply_sec is %ld ms",
                            sec_RTO, reply->receive, reply->flush, reply->apply, walsnd->log_ctrl.prev_flush,
                            walsnd->log_ctrl.prev_apply, millisec_time_diff, flushSpeed, applySpeed,
                            needFlush / flushSpeed, (needFlush + needApply) / applySpeed)));
}

#ifndef ENABLE_LITE_MODE
/*
 * Measure how far the controlled indicator is from its target and how much it
 * moved since the previous sample.  The indicator is the RPO when isHadrRPO is
 * true and the RTO otherwise.
 *
 * Outputs:
 *   gap         - current indicator minus half of the configured target
 *                 (half-target is 0 when no RTO target is configured)
 *   gapDiff     - current indicator minus the previous indicator
 *   isEagerMode - true when the indicator is above the full target or <= 1;
 *                 left untouched when no RTO target is configured
 *
 * A negative previous indicator is replaced by the current one before the
 * difference is taken, so that sample yields gapDiff == 0.
 */
static void LogCtrlCalculateIndicatorChange(int64 *gapDiff, int64 *gap, bool *isEagerMode, const bool isHadrRPO)
{
    volatile WalSnd *sender = t_thrd.walsender_cxt.MyWalSnd;

    if (!isHadrRPO) {
        /* RTO control: which GUC supplies the target depends on the sender kind. */
        const bool hadrSender = (AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER);
        int halfTargetRTO = 0;

        if (hadrSender && u_sess->attr.attr_storage.hadr_recovery_time_target) {
            halfTargetRTO = u_sess->attr.attr_storage.hadr_recovery_time_target / 2;
            *isEagerMode = sender->log_ctrl.current_RTO > u_sess->attr.attr_storage.hadr_recovery_time_target ||
                sender->log_ctrl.current_RTO <= 1;
        } else if (!hadrSender && u_sess->attr.attr_storage.target_rto > 0) {
            halfTargetRTO = u_sess->attr.attr_storage.target_rto / 2;
            *isEagerMode = sender->log_ctrl.current_RTO > u_sess->attr.attr_storage.target_rto ||
                sender->log_ctrl.current_RTO <= 1;
        } else {
            /* Neither target applies to this sender; carry on with a zero half-target. */
            ereport(WARNING,
                (errmsg("[CalculateIndicatorChange] got the wrong targetRTO, target_rto is %d, "
                "hadr_recovery_time_target is %d, hadr_recovery_point_target is %d",
                u_sess->attr.attr_storage.target_rto, u_sess->attr.attr_storage.hadr_recovery_time_target,
                u_sess->attr.attr_storage.hadr_recovery_point_target)));
        }

        /* Seed the history on the first sample. */
        if (sender->log_ctrl.prev_RTO < 0) {
            sender->log_ctrl.prev_RTO = sender->log_ctrl.current_RTO;
        }
        *gap = sender->log_ctrl.current_RTO - halfTargetRTO;
        *gapDiff = sender->log_ctrl.current_RTO - sender->log_ctrl.prev_RTO;
    } else {
        /* RPO control: the target always comes from hadr_recovery_point_target. */
        int halfTargetRPO = u_sess->attr.attr_storage.hadr_recovery_point_target / 2;

        /* Seed the history on the first sample. */
        if (sender->log_ctrl.prev_RPO < 0) {
            sender->log_ctrl.prev_RPO = sender->log_ctrl.current_RPO;
        }

        *gap = sender->log_ctrl.current_RPO - halfTargetRPO;
        *gapDiff = sender->log_ctrl.current_RPO - sender->log_ctrl.prev_RPO;
        *isEagerMode = sender->log_ctrl.current_RPO > u_sess->attr.attr_storage.hadr_recovery_point_target ||
            sender->log_ctrl.current_RPO <= 1;
    }

    ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
                        errmsg("[CalculateIndicatorChange] gap=%d, gap_diff=%d,"
                            "isEagerMode=%d, isHadrRPO=%d",
                            (int)*gap, (int)*gapDiff,(int)*isEagerMode, (int)isHadrRPO)));
}

/*
 * If a previous send time is recorded and ComputeTimeStamp() of it exceeds
 * three seconds' worth of milliseconds, cut *sleepTime by
 * SLEEP_LESS * EAGER_MODE_MULTIPLE, never letting it drop below zero.
 * Otherwise *sleepTime is left unchanged.
 */
static void LogCtrlTreatNoDataSend(int64 *sleepTime)
{
    volatile WalSnd *sender = t_thrd.walsender_cxt.MyWalSnd;

    const bool idleTooLong = sender->log_ctrl.prev_send_time > 0 &&
        ComputeTimeStamp(sender->log_ctrl.prev_send_time) > (MILLISECONDS_PER_SECONDS * 3);
    if (!idleTooLong) {
        return;
    }

    *sleepTime -= SLEEP_LESS * EAGER_MODE_MULTIPLE;
    if (*sleepTime < 0) {
        *sleepTime = 0;
    }
    ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
        errmsg("Walsender send data interval more than 3s, sleep time reduced to: %ld ", *sleepTime)));
}
#endif

/*
 * Recompute the log-control sleep time (in microseconds) for the primary.
 *
 * If current RTO/RPO is less than target_rto/time_to_target_rpo, primary need less sleep.
 * If current RTO/RPO is more than target_rto/time_to_target_rpo, primary need more sleep.
 * If current RTO/RPO equals to target_rto/time_to_target_rpo, primary will sleep
 * according to balance_sleep to maintain rto.
 *
 * Parameters:
 *   logCtrlSleepTime - the sleep time currently in effect; used as the starting point
 *   balanceSleepTime - the previously recorded "balance" sleep time, 0 if none yet
 *   isHadrRPO        - true to control on RPO, false to control on RTO
 *
 * Both parameters are passed by value; the results are published at the end:
 *   RPO mode -> g_instance.streaming_dr_cxt.rpoSleepTime / rpoBalanceSleepTime
 *   RTO mode -> walsnd->log_ctrl.sleep_time / balance_sleep_time
 *
 * The resulting sleep time is kept within [0, MICROSECONDS_PER_SECONDS].
 * In lite mode the function only invokes FEATURE_ON_LITE_MODE_NOT_SUPPORTED().
 */
static void LogCtrlCalculateSleepTime(int64 logCtrlSleepTime, int64 balanceSleepTime, const bool isHadrRPO)
{
#ifndef ENABLE_LITE_MODE
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    /* Step sizes by which the sleep time is increased / decreased. */
    int addLevel;
    int reduceLevel;

    /* use for rto log: remember the incoming value to detect on/off transitions below */
    int64 pre_time = logCtrlSleepTime;

    /* Range to allow rto/rpo to fluctuate up and down the target/2 */
    int balance_range = 1;
    const int NEEDS_LARGER_RANGE = 60;
    if (isHadrRPO) {
        /* RPO control uses smaller steps than RTO control. */
        addLevel = SLEEP_MORE / EAGER_MODE_MULTIPLE;
        reduceLevel = SLEEP_LESS / EAGER_MODE_MULTIPLE;
    } else {
        addLevel = SLEEP_MORE;
        reduceLevel = SLEEP_LESS;
        /*
         * Widen the tolerated band when the applicable target is >= NEEDS_LARGER_RANGE.
         * NOTE(review): this selection tests only AM_WAL_HADR_DNCN_SENDER, whereas the
         * targetRTO selection further down (and LogCtrlCalculateIndicatorChange) also
         * treats AM_WAL_SHARE_STORE_SENDER as using hadr_recovery_time_target -- confirm
         * whether share-storage senders are meant to consult target_rto here.
         */
        if (AM_WAL_HADR_DNCN_SENDER && u_sess->attr.attr_storage.hadr_recovery_time_target >= NEEDS_LARGER_RANGE) {
            balance_range = 2;
        } else if(!AM_WAL_HADR_DNCN_SENDER && u_sess->attr.attr_storage.target_rto >= NEEDS_LARGER_RANGE) {
            balance_range = 2;
        }
        /* May lower logCtrlSleepTime in place when nothing was sent for a while. */
        LogCtrlTreatNoDataSend(&logCtrlSleepTime);
    }
    /* Working copy; the branches below adjust it and then derive logCtrlSleepTime from it. */
    int64 sleepTime = logCtrlSleepTime;
    int64 gapDiff;
    int64 gap;
    bool isEagerMode = false;
    LogCtrlCalculateIndicatorChange(&gapDiff, &gap, &isEagerMode, isHadrRPO);

    /*
     * mark balance sleep time: the indicator barely moved since the last sample, so the
     * current sleep time is recorded as (or blended into) the balance value.
     * NOTE(review): abs() is applied to an int64 here -- confirm a 64-bit overload is
     * the one selected in this translation unit.
     */
    if (abs(gapDiff) <= 1) {
        if (balanceSleepTime == 0) {
            balanceSleepTime = sleepTime;
        } else {
            /* presumably a weighted moving average of old and new values -- see LogCtrlCountBigSpeed */
            balanceSleepTime = (int64)LogCtrlCountBigSpeed((uint64)balanceSleepTime, (uint64)sleepTime >> SHIFT_SPEED);
        }
        if (isHadrRPO) {
            ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
                            errmsg("The RPO balance time for log control is : %ld microseconds", balanceSleepTime)));
        } else {
            ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
                             errmsg("The RTO balance time for log control is : %ld microseconds", balanceSleepTime)));
        }
    }

    /*
     * The three gap cases below are mutually exclusive.  When the gap is inside the
     * band but eager mode is set, none of them fires and logCtrlSleepTime keeps the
     * value it had after LogCtrlTreatNoDataSend().
     */

    /* rto balance, currentRTO close to targetRTO */
    if (abs(gap) <= balance_range && !isEagerMode) {
        if (balanceSleepTime != 0) {
            /* A balance value is known: use it directly. */
            logCtrlSleepTime = balanceSleepTime;
        } else if (gapDiff < 0) {
            /* Indicator is falling: sleep a little less, not below zero. */
            sleepTime -= reduceLevel;
            logCtrlSleepTime = (sleepTime >= 0) ? sleepTime : 0;
        } else {
            /* Indicator is flat or rising: sleep a little more, capped at one second. */
            sleepTime += addLevel;
            logCtrlSleepTime = (sleepTime < 1 * MICROSECONDS_PER_SECONDS) ? sleepTime : MICROSECONDS_PER_SECONDS;
        }
    }

    /* need more sleep, currentRTO larger than targetRTO
     *  get bigger, but no more than 1s
     */
    if (gap > balance_range) {
        if (isEagerMode) {
            /* Eager mode takes a multiplied step. */
            sleepTime += addLevel * EAGER_MODE_MULTIPLE;
        } else if (gapDiff > 0) {
            sleepTime += addLevel;
        }
        /* When neither condition holds, sleepTime is unchanged but still re-capped. */
        logCtrlSleepTime = (sleepTime < 1 * MICROSECONDS_PER_SECONDS) ? sleepTime : MICROSECONDS_PER_SECONDS;
    }

    /* need less sleep, currentRTO less than targetRTO */
    if (gap < -balance_range) {
        if (isEagerMode) {
            /* With no balance value recorded, drop the sleep time straight to zero. */
            sleepTime -= (balanceSleepTime == 0) ? sleepTime : reduceLevel * EAGER_MODE_MULTIPLE;
        } else if (gapDiff < 0) {
            sleepTime -= reduceLevel;
        }
        logCtrlSleepTime = (sleepTime >= 0) ? sleepTime : 0;
    }

    /* Full (not halved) RTO target; only used in the LOG messages below. */
    int targetRTO = 0;
    if (AM_WAL_HADR_DNCN_SENDER || AM_WAL_SHARE_STORE_SENDER) {
        targetRTO = u_sess->attr.attr_storage.hadr_recovery_time_target;
    } else {
        targetRTO = u_sess->attr.attr_storage.target_rto;
    }
    /* log control takes effect: sleep time went from zero to non-zero */
    if (pre_time == 0 && logCtrlSleepTime != 0) {
        if (isHadrRPO) {
            ereport(LOG,
                (errmodule(MOD_RTO_RPO),
                errmsg("Log control take effect due to RPO, target_rpo is %d, current_rpo is %ld, "
                       "current the sleep time is %ld microseconds",
                       u_sess->attr.attr_storage.hadr_recovery_point_target,
                       walsnd->log_ctrl.current_RPO, logCtrlSleepTime)));
        } else {
            ereport(LOG,
                (errmodule(MOD_RTO_RPO),
                errmsg("Log control take effect due to RTO, target_rto is %d, current_rto is %ld, "
                       "current the sleep time is %ld microseconds",
                       targetRTO, walsnd->log_ctrl.current_RTO, logCtrlSleepTime)));
        }
    }
    /* log control no longer takes effect: sleep time went from non-zero to zero */
    if (pre_time != 0 && logCtrlSleepTime == 0) {
        if (isHadrRPO) {
            ereport(LOG,
                (errmodule(MOD_RTO_RPO),
                errmsg("Log control does not take effect due to RPO, target_rpo is %d, current_rpo is %ld, "
                       "current the sleep time is %ld microseconds",
                       u_sess->attr.attr_storage.hadr_recovery_point_target,
                       walsnd->log_ctrl.current_RPO, logCtrlSleepTime)));
        } else {
            ereport(LOG,
                (errmodule(MOD_RTO_RPO),
                errmsg("Log control does not take effect because of RTO, target_rto is %d, current_rto is %ld, "
                       "current the sleep time is %ld microseconds",
                       targetRTO, walsnd->log_ctrl.current_RTO, logCtrlSleepTime)));
        }
    }
    /* return the value and print debug log */
    if (isHadrRPO) {
        /* RPO results are stored instance-wide. */
        g_instance.streaming_dr_cxt.rpoSleepTime = logCtrlSleepTime;
        g_instance.streaming_dr_cxt.rpoBalanceSleepTime = balanceSleepTime;
        ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
            errmsg("The RPO sleep time for log control is : %ld microseconds, current RPO is : %ld",
                logCtrlSleepTime, walsnd->log_ctrl.current_RPO)));
    } else {
        /* RTO results are stored on this walsender's slot. */
        walsnd->log_ctrl.sleep_time = logCtrlSleepTime;
        walsnd->log_ctrl.balance_sleep_time = balanceSleepTime;
        ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
            errmsg("The RTO sleep time for log control is : %ld microseconds, current RTO is : %ld",
                logCtrlSleepTime, walsnd->log_ctrl.current_RTO)));
    }
#else
    FEATURE_ON_LITE_MODE_NOT_SUPPORTED();
#endif
}

/*
 * Estimate the current RPO (in seconds) of the standby that sent `reply` and
 * store it in walsnd->log_ctrl.current_RPO, shifting the old value into
 * prev_RPO.
 *
 * The estimate is (local flush position - standby flush position) divided by
 * the smoothed standby flush rate.  The sample is skipped, leaving the stored
 * values untouched, when:
 *   - the local flush position cannot be determined,
 *   - the standby flush position is ahead of the local one or behind the
 *     previously recorded one,
 *   - no previous reply time is recorded, or
 *   - no more than 100 ms elapsed since the previous reply.
 * When the standby has flushed everything, the RPO is set to 0.
 *
 * In lite mode the function only invokes FEATURE_ON_LITE_MODE_NOT_SUPPORTED().
 */
static void LogCtrlCalculateCurrentRPO(StandbyReplyMessage *reply)
{
#ifndef ENABLE_LITE_MODE
    volatile WalSnd *sender = t_thrd.walsender_cxt.MyWalSnd;
    XLogRecPtr localFlush;

    /* Step 1: find the flush position on this side; the source depends on the sender kind. */
    if (AM_WAL_HADR_CN_SENDER) {
        localFlush = GetFlushRecPtr();
    } else if (AM_WAL_SHARE_STORE_SENDER) {
        if (SS_REPLICATION_DORADO_CLUSTER) {
            localFlush = g_instance.xlog_cxt.ssReplicationXLogCtl->insertHead;
        } else {
            localFlush = g_instance.xlog_cxt.shareStorageXLogCtl->insertHead;
        }
    } else {
        XLogRecPtr syncReceive;
        XLogRecPtr syncWrite;
        XLogRecPtr syncReplay;
        bool amSync = false;

        if (!SyncRepGetSyncRecPtr(&syncReceive, &syncWrite, &localFlush, &syncReplay, &amSync, false)) {
            ereport(WARNING,
                (errmsg("In disaster mode, calculate standby cluster RPO failed because could not got main cluster "
                        "flush location")));
            return;
        }
    }

    /* Step 2: discard samples whose positions are out of order. */
    if (XLByteLT(localFlush, reply->flush) || XLByteLT(reply->flush, sender->log_ctrl.prev_flush)) {
        return;
    }

    /* Step 3: nothing outstanding means an RPO of zero. */
    if (XLByteEQ(localFlush, reply->flush)) {
        sender->log_ctrl.prev_RPO = sender->log_ctrl.current_RPO;
        sender->log_ctrl.current_RPO = 0;
        return;
    }

    /* Step 4: a rate needs a previous reply and a long enough interval. */
    if (sender->log_ctrl.prev_reply_time == 0) {
        return;
    }
    long elapsedSecs;
    int elapsedMicros;
    TimestampDifference(sender->log_ctrl.prev_reply_time, reply->sendTime, &elapsedSecs, &elapsedMicros);
    long elapsedMs = elapsedSecs * MILLISECONDS_PER_SECONDS + elapsedMicros / MILLISECONDS_PER_MICROSECONDS;
    if (elapsedMs <= 100) {
        return;
    }

    /* Step 5: fold the flush progress of this interval into the stored rate. */
    uint64 pendingBytes = localFlush - reply->flush;
    uint64 flushedBytes = reply->flush - sender->log_ctrl.prev_flush;
    uint64 intervalRate = flushedBytes / (uint64)elapsedMs;

    if ((sender->log_ctrl.local_flush_rate >> SHIFT_SPEED) > 1) {
        sender->log_ctrl.local_flush_rate = LogCtrlCountBigSpeed(sender->log_ctrl.local_flush_rate, intervalRate);
    } else {
        /* No usable history yet: start from the rate of this interval. */
        sender->log_ctrl.local_flush_rate = (intervalRate << SHIFT_SPEED);
    }

    /* Step 6: turn the backlog into a time estimate, never dividing by zero. */
    uint64 drainRate = (sender->log_ctrl.local_flush_rate >> SHIFT_SPEED);
    if (drainRate == 0) {
        drainRate = 1;
    }
    uint64 rpoMillis = pendingBytes / drainRate;

    sender->log_ctrl.prev_RPO = sender->log_ctrl.current_RPO;
    sender->log_ctrl.current_RPO = rpoMillis / MILLISECONDS_PER_SECONDS;
    ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
                    errmsg("The RPO estimated is = : %ld seconds. local flush is %lu, reply->flush is %lu, "
                           "prev_flush is %lu, TimestampDifference is %ld, "
                           "consumeRatePart is %lu, RPO millisecond is %ld",
                           sender->log_ctrl.current_RPO, localFlush, reply->flush, sender->log_ctrl.prev_flush,
                           elapsedMs, drainRate, rpoMillis)));
#else
    FEATURE_ON_LITE_MODE_NOT_SUPPORTED();
#endif
}

#ifdef ENABLE_MULTIPLE_NODES
static void LogCtrlCalculateHadrCurrentRPO(void)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    int64 targetBarrierTimeStamp;
    int64 currentBarrierTimeStamp;
    int64 timeDiff;
    errno_t errorno = EOK;
    char targetBarrierId[MAX_BARRIER_ID_LENGTH];
    char currentBarrierId[MAX_BARRIER_ID_LENGTH];

    SpinLockAcquire(&g_instance.streaming_dr_cxt.mutex);
    errorno = strncpy_s((char *)targetBarrierId, MAX_BARRIER_ID_LENGTH,
        (char *)g_instance.streaming_dr_cxt.targetBarrierId, MAX_BARRIER_ID_LENGTH);
    securec_check(errorno, "\0", "\0");
    errorno = strncpy_s((char *)currentBarrierId, MAX_BARRIER_ID_LENGTH,
        (char *)g_instance.streaming_dr_cxt.currentBarrierId, MAX_BARRIER_ID_LENGTH);
    securec_check(errorno, "\0", "\0");
    SpinLockRelease(&g_instance.streaming_dr_cxt.mutex);

    if (!IS_CSN_BARRIER(currentBarrierId) || !IS_CSN_BARRIER(targetBarrierId)) {
        return;
    }

    if (IsSwitchoverBarrier(targetBarrierId)) {
        walsnd->log_ctrl.prev_RPO = walsnd->log_ctrl.current_RPO;
        walsnd->log_ctrl.current_RPO = 0;
        return;
    }

    targetBarrierTimeStamp = CsnBarrierNameGetTimeStamp(targetBarrierId);
    currentBarrierTimeStamp = CsnBarrierNameGetTimeStamp(currentBarrierId);
    if (targetBarrierTimeStamp == 0 || currentBarrierTimeStamp == 0) {
        ereport(WARNING,
            (errmsg("[HADR_RPO] get barrierName failure, targetBarrierId: %s, currentBarrierId: %s",
            targetBarrierId, currentBarrierId)));
        return;
    }
    timeDiff = currentBarrierTimeStamp - targetBarrierTimeStamp;
    if (timeDiff < 0) {
        timeDiff = 0;
    }
    walsnd->log_ctrl.prev_RPO = walsnd->log_ctrl.current_RPO;
    walsnd->log_ctrl.current_RPO = timeDiff / MILLISECONDS_PER_SECONDS;
    ereport(DEBUG4, (errmodule(MOD_RTO_RPO),
                    errmsg("The RPO estimated is = : %ld seconds. targetBarrierId: %s, currentBarrierId: %s, "
                           "RPO millisecond is %ld",
                           walsnd->log_ctrl.current_RPO, targetBarrierId, currentBarrierId, timeDiff)));
}
#endif

static void ChooseStartPointForDummyStandby(void)
{
    XLogRecPtr initSentPtr;

    if (!XLByteEQ(t_thrd.walsender_cxt.sentPtr, InvalidXLogRecPtr)) {
        ereport(DEBUG1, (errmsg("use current sentPtr %X/%X as sync secondary startpoint",
                                (uint32)(t_thrd.walsender_cxt.sentPtr >> 32), (uint32)t_thrd.walsender_cxt.sentPtr)));
        return;
    }

    t_thrd.xlog_cxt.server_mode = PRIMARY_MODE;
    ReplicationSlotsComputeRequiredLSN(NULL);
    initSentPtr = XLogGetReplicationSlotMaximumLSN();

    ReplicationSlotReportRestartLSN();
    ereport(LOG, (errmsg("init sentPtr at %X/%X, latestValidRecord is %X/%X", (uint32)(initSentPtr >> 32),
                         (uint32)initSentPtr, (uint32)(latestValidRecord >> 32), (uint32)latestValidRecord)));

    if (XLByteEQ(initSentPtr, InvalidXLogRecPtr))
        initSentPtr = latestValidRecord;

    /*
     * Ref RequestXLogStreaming()
     * We always start at the beginning of the segment. That prevents a broken
     * segment (i.e., with no records in the first half of a segment) from
     * being created by XLOG streaming, which might cause trouble later on if
     * the segment is e.g archived.
     * Prev the requested segment if request xlog from the beginning of a segment.
     */
    if (initSentPtr % XLogSegSize != 0) {
        initSentPtr -= initSentPtr % XLogSegSize;
    } else {
        XLogSegNo _logSeg;
        XLByteToSeg(initSentPtr, _logSeg);
        _logSeg--;
        initSentPtr = _logSeg * XLogSegSize;
    }

    t_thrd.walsender_cxt.sentPtr = MAX_XLOG_RECORD(t_thrd.walsender_cxt.sentPtr, initSentPtr);

    ereport(
        DEBUG2,
        (errmsg(
            "In ChooseStartPointForDummyStandby(): initSentPtr is %X/%X, latestValidRecord is %X/%X, sentPtr is %X/%X.",
            (uint32)(initSentPtr >> 32), (uint32)initSentPtr, (uint32)(latestValidRecord >> 32),
            (uint32)latestValidRecord, (uint32)(t_thrd.walsender_cxt.sentPtr >> 32),
            (uint32)t_thrd.walsender_cxt.sentPtr)));
}
/*
 * Page-read callback used by the walsender's XLOG reader.
 *
 * Reads the XLOG_BLCKSZ-sized page that starts at targetPagePtr from the WAL
 * segment file under XLOGDIR into readBuf.  The file descriptor is cached in
 * the reader's private data (WSXLogPageReadPrivate) and reused as long as
 * consecutive requests fall into the same segment.
 *
 * Parameters:
 *   xlogreader    - reader whose private_data holds the cached fd/segment/timeline
 *   targetPagePtr - start position of the page to read
 *   reqLen        - requested length; only used in the read-failure message
 *   targetRecPtr  - unused here
 *   readBuf       - destination buffer, must hold XLOG_BLCKSZ bytes
 *   pageTLI       - out: set to the private data's timeline on success
 *   xlog_path     - unused here
 *
 * Returns XLOG_BLCKSZ on success, -1 on any failure (missing private data,
 * open, seek or read failure).  On failure an already opened fd stays cached.
 */
static int WSXLogPageRead(XLogReaderState *xlogreader, XLogRecPtr targetPagePtr, int reqLen, XLogRecPtr targetRecPtr,
                          char *readBuf, TimeLineID *pageTLI, char* xlog_path = NULL)
{
    WSXLogPageReadPrivate *ws_private = (WSXLogPageReadPrivate *)xlogreader->private_data;
    uint32 targetPageOff;
    int nRetCode = 0;
    char xlogfile[MAXFNAMELEN];
    char xlogfpath[MAXPGPATH];

    if (ws_private == NULL) {
        Assert(false);
        ereport(WARNING, (errmsg("The WAL Streaming XLog Reader Private Info is NULL.")));
        return -1;
    }

    /* Drop the cached descriptor when the request moved to another segment. */
    if (ws_private->xlogreadfd >= 0 && !XLByteInSeg(targetPagePtr, ws_private->xlogreadlogsegno)) {
        (void)close(ws_private->xlogreadfd);
        ws_private->xlogreadfd = -1;
    }

    XLByteToSeg(targetPagePtr, ws_private->xlogreadlogsegno);

    /*
     * Build the segment path unconditionally.  It is needed for the open below
     * and also appears in the seek/read failure messages; building it only when
     * (re)opening would leave xlogfpath uninitialized in those messages whenever
     * a cached descriptor is reused.
     */
    XLogFileName(xlogfile, MAXFNAMELEN, ws_private->tli, ws_private->xlogreadlogsegno);

    nRetCode = snprintf_s(xlogfpath, MAXPGPATH, MAXPGPATH - 1, XLOGDIR "/%s", xlogfile);
    securec_check_ss(nRetCode, "\0", "\0");

    if (ws_private->xlogreadfd < 0) {
        ws_private->xlogreadfd = BasicOpenFile(xlogfpath, O_RDONLY | PG_BINARY, 0);

        if (ws_private->xlogreadfd < 0) {
            ereport(DEBUG2, (errmsg("could not open the xlog file %s: %s.", xlogfpath, gs_strerror(errno))));
            return -1;
        }
    }

    /* Offset of the page inside its segment file. */
    targetPageOff = targetPagePtr % XLogSegSize;

    /* Read the requested page */
    if (lseek(ws_private->xlogreadfd, (off_t)targetPageOff, SEEK_SET) < 0) {
        Assert(false);
        ereport(WARNING,
                (errmsg("could not seek %u bytes in the file %s: %s.", targetPageOff, xlogfpath, gs_strerror(errno))));
        return -1;
    }

    /* A short read is treated as a failure: a whole page is always required. */
    if (read(ws_private->xlogreadfd, readBuf, XLOG_BLCKSZ) != XLOG_BLCKSZ) {
        Assert(false);
        ereport(WARNING, (errmsg("could not read the request %d bytes in the xlog file %s: %s.", reqLen, xlogfpath,
                                 gs_strerror(errno))));
        return -1;
    }

    *pageTLI = ws_private->tli;
    return XLOG_BLCKSZ;
}

static void InitWalSndXLogReader()
{
    WSXLogPageReadPrivate *ws_private = NULL;
    errno_t rc = 0;

    if (t_thrd.walsender_cxt.ws_xlog_reader) {
        if (t_thrd.walsender_cxt.ws_xlog_reader->private_data) {
            pfree((WSXLogPageReadPrivate *)t_thrd.walsender_cxt.ws_xlog_reader->private_data);
            t_thrd.walsender_cxt.ws_xlog_reader->private_data = NULL;
        }

        XLogReaderFree(t_thrd.walsender_cxt.ws_xlog_reader);
        t_thrd.walsender_cxt.ws_xlog_reader = NULL;
    }

    /*
     * Allocate the xlogreader used for xlog parsing.
     */
    ws_private = (WSXLogPageReadPrivate *)palloc(sizeof(WSXLogPageReadPrivate));

    /* Set up XLOG reader facility */
    rc = memset_s(ws_private, sizeof(WSXLogPageReadPrivate), 0, sizeof(WSXLogPageReadPrivate));
    securec_check(rc, "\0", "\0");
    ws_private->xlogreadfd = -1;
    ws_private->tli = t_thrd.xlog_cxt.ThisTimeLineID;

    t_thrd.walsender_cxt.ws_xlog_reader = XLogReaderAllocate(&WSXLogPageRead, ws_private);

    if (!t_thrd.walsender_cxt.ws_xlog_reader)
        ereport(ERROR, (errcode(ERRCODE_INVALID_STATUS), errmsg("Failed to init the xlog reader for the wal sender.")));
    else
        ereport(LOG, (errmsg("Succeeded to init the xlog reader for the wal sender.")));

    return;
}

/*
 * Allocate the buffers used for outgoing messages.  This is done once up
 * front to avoid repeated palloc calls, so each buffer is sized for the
 * largest possible message (WS_MAX_SEND_SIZE plus its header).
 *
 * Without mixed replication only the XLOG message buffer is needed.  With
 * mixed replication the XLOG buffer gets a longer prefix, a data-page message
 * buffer and a CU load buffer are allocated as well, the XLOG reader is
 * initialised and the just-sent region is reset.
 *
 * In both cases the XLOG message buffer is registered with
 * bbox_blacklist_add() when BBOX_BLACKLIST_XLOG_MESSAGE_SEND is set.
 */
static void WSDataSendInit()
{
    if (g_instance.attr.attr_storage.enable_mix_replication) {
        /* Mixed replication: the prefix carries extra fields in front of the payload. */
        t_thrd.walsender_cxt.output_xlog_msg_prefix_len = 1 + sizeof(WalDataMessageHeader) + sizeof(uint32) + 1 +
                                                          sizeof(XLogRecPtr);
        const size_t mixXlogMsgSize = t_thrd.walsender_cxt.output_xlog_msg_prefix_len + (int)WS_MAX_SEND_SIZE;
        const size_t mixDataMsgSize =
            1 + sizeof(WalDataPageMessageHeader) + sizeof(uint32) + 1 + sizeof(XLogRecPtr) * 2 + (int)WS_MAX_SEND_SIZE;

        t_thrd.walsender_cxt.output_xlog_message = (char *)palloc(mixXlogMsgSize);
        t_thrd.walsender_cxt.output_data_message = (char *)palloc(mixDataMsgSize);
        t_thrd.walsender_cxt.output_data_msg_cur_len = 0;
        t_thrd.walsender_cxt.load_cu_buffer = (char *)palloc(t_thrd.walsender_cxt.load_cu_buffer_size);

        InitWalSndXLogReader();

        /* Nothing has been sent yet. */
        t_thrd.walsender_cxt.wsXLogJustSendRegion->start_ptr = InvalidXLogRecPtr;
        t_thrd.walsender_cxt.wsXLogJustSendRegion->end_ptr = InvalidXLogRecPtr;

        if (BBOX_BLACKLIST_XLOG_MESSAGE_SEND) {
            bbox_blacklist_add(XLOG_MESSAGE_SEND, t_thrd.walsender_cxt.output_xlog_message, mixXlogMsgSize);
        }
        return;
    }

    /* Plain streaming replication: one buffer of message type byte + header + payload. */
    const size_t xlogMsgSize = 1 + sizeof(WalDataMessageHeader) + (int)WS_MAX_SEND_SIZE;

    t_thrd.walsender_cxt.output_xlog_message = (char *)palloc(xlogMsgSize);
    if (BBOX_BLACKLIST_XLOG_MESSAGE_SEND) {
        bbox_blacklist_add(XLOG_MESSAGE_SEND, t_thrd.walsender_cxt.output_xlog_message, xlogMsgSize);
    }
}

/* Main loop of walsender process */
static int WalSndLoop(WalSndSendDataCallback send_data)
{
    bool first_startup = true;
    bool sync_config_needed = false;
    bool marked_stream_replication = true;
    TimestampTz last_syncconf_timestamp;

    WSDataSendInit();

    /*
     * Allocate buffer that will be used for processing reply messages.  As
     * above, do this just once to reduce palloc overhead.
     */
    initStringInfo(t_thrd.walsender_cxt.reply_message);
    initStringInfo(t_thrd.walsender_cxt.tmpbuf);

    /* Initialize the last reply timestamp */
    t_thrd.walsender_cxt.last_reply_timestamp = GetCurrentTimestamp();
    last_syncconf_timestamp = GetCurrentTimestamp();
    t_thrd.walsender_cxt.last_logical_xlog_advanced_timestamp = GetCurrentTimestamp();
    t_thrd.walsender_cxt.last_logical_slot_advanced_timestamp = GetCurrentTimestamp();
    t_thrd.walsender_cxt.waiting_for_ping_response = false;
#define MINUTE_30 (30 * 60 * 1000) /* 30 minutes */
    t_thrd.walsender_cxt.timeoutCheckInternal = u_sess->attr.attr_storage.wal_sender_timeout;
    if (strcmp(u_sess->attr.attr_common.application_name, "gs_probackup") == 0 &&
        t_thrd.walsender_cxt.timeoutCheckInternal < MINUTE_30) {
        t_thrd.walsender_cxt.timeoutCheckInternal = MINUTE_30;
    }

    ResourceOwner tmpOwner = t_thrd.utils_cxt.CurrentResourceOwner;
    Assert(!IsTransactionOrTransactionBlock() &&
        strcmp(ResourceOwnerGetName(tmpOwner), "walsender top-level resource owner") == 0);
    /* Loop forever, unless we get an error */
    for (;;) {
        t_thrd.utils_cxt.CurrentResourceOwner = tmpOwner;
        TimestampTz now;

        /* Clear any already-pending wakeups */
        ResetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
#ifdef ENABLE_DISTRIBUTE_TEST
        if (TEST_STUB(DN_WALSEND_MAINLOOP, stub_sleep_emit)) {
            ereport(get_distribute_test_param()->elevel,
                    (errmsg("sleep_emit happen during WalSndLoop  time:%ds, stub_name:%s",
                            get_distribute_test_param()->sleep_time, get_distribute_test_param()->test_stub_name)));
        }
#endif

        pgstat_report_activity(STATE_RUNNING, NULL);

        /*
         * Emergency bailout if postmaster has died.  This is to avoid the
         * necessity for manual cleanup of all postmaster children.
         */
        if (!PostmasterIsAlive())
            gs_thread_exit(1);

        /* Process any requests or signals received recently */
        if (t_thrd.walsender_cxt.got_SIGHUP) {
            t_thrd.walsender_cxt.got_SIGHUP = false;
            marked_stream_replication = u_sess->attr.attr_storage.enable_stream_replication;
            ProcessConfigFile(PGC_SIGHUP);
            SyncRepInitConfig();
#ifndef ENABLE_MULTIPLE_NODES
            if (g_instance.attr.attr_common.sync_config_strategy == ALL_NODE ||
                (g_instance.attr.attr_common.sync_config_strategy == ONLY_SYNC_NODE &&
                t_thrd.walsender_cxt.MyWalSnd->sync_standby_priority > 0)) {
                sync_config_needed = true;
            } else {
                sync_config_needed = false;
            }
#else
            sync_config_needed = true;
#endif
        }

        ArchiveXlogMessage *archive_message = NULL;
        archive_message = get_archive_task_from_list();
        if (unlikely(archive_message != NULL)) {
            WalSndArchiveXlog(archive_message);
        }

        /* switchover is forbidden when catchup thread in progress */
        if (catchup_online && t_thrd.walsender_cxt.WalSndCtl->demotion > NoDemote) {
            volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
            SpinLockAcquire(&t_thrd.walsender_cxt.WalSndCtl->mutex);

            walsnd->node_state = NODESTATE_PRIMARY_DEMOTING_WAIT_CATCHUP;
            WalSndResponseSwitchover(t_thrd.walsender_cxt.output_xlog_message);

            /* recover node_state and demotion state */
            walsnd->node_state = NODESTATE_NORMAL;
            t_thrd.walsender_cxt.WalSndCtl->demotion = NoDemote;
            t_thrd.walsender_cxt.Demotion = NoDemote;

            SpinLockRelease(&t_thrd.walsender_cxt.WalSndCtl->mutex);

            ereport(PANIC,
                    (errmsg("walsender stop switchover process for catchup is alive, the process need to be restart")));
        }

        /* Normal exit from the walsender is here */
        if ((t_thrd.walsender_cxt.walsender_shutdown_requested &&
             !t_thrd.walsender_cxt.response_switchover_requested) ||
            t_thrd.walsender_cxt.MyWalSnd->node_state == NODESTATE_STANDBY_REDIRECT) {
            /* Inform the standby that XLOG streaming is done */
            if (!sync_config_needed) {
                pq_puttextmessage('C', "COPY 0");
                (void)pq_flush();

                proc_exit(0);
            }
        }

        /*
         * In the scenario where the stream replication connection is set to standby connection,
         * if the role is the primary, disconnect the connection.
         * This is to avoid the decoding thread occupying the primary resources.
         */
        if (t_thrd.walsender_cxt.standbyConnection == true && PMstateIsRun()) {
            ereport(ERROR, (errmsg("walsender closed because of role is primary.")));
        }

        /* if changed to stream replication, request for catchup. */
        if (u_sess->attr.attr_storage.enable_stream_replication && !marked_stream_replication) {
            marked_stream_replication = u_sess->attr.attr_storage.enable_stream_replication;
            WalSndSetState(WALSNDSTATE_CATCHUP);
        }

        if (t_thrd.walsender_cxt.response_switchover_requested) {
            if (t_thrd.walsender_cxt.MyWalSnd->peer_role != STANDBY_MODE) {
                ereport(LOG, (errmsg("walsender closed because of switchover.")));
                proc_exit(0);
            }
        }

        /* Check for input from the client */
        ProcessRepliesIfAny();

        /* Walsender first startup, send a keepalive to standby, no need reply. */
        if (first_startup) {
            WalSndKeepalive(false);
            first_startup = false;
        }

        /* send switchover response message to standby if requested */
        if (t_thrd.walsender_cxt.response_switchover_requested) {
            XLogRecPtr WriteRqstPtr;
            uint32 XLogPageOffSet;

            WriteRqstPtr = GetXLogInsertEndRecPtr();
            XLogPageOffSet = WriteRqstPtr % XLOG_BLCKSZ;

            ereport(LOG, (errmsg("The WAL sender in primary is ready to do the switchover.")));

            ereport(LOG,
                    (errmsg("the latest WAL insert at %X/%X", (uint32)(WriteRqstPtr >> 32), (uint32)WriteRqstPtr)));

            /*
             * Check whether the write requestptr points to the end of new
             * page header, we try to flush to the end of last page instead
             * of the new page header.
             */
            if (SizeOfXLogLongPHD == XLogPageOffSet || SizeOfXLogShortPHD == WriteRqstPtr % XLogSegSize) {
                WriteRqstPtr -= XLogPageOffSet;
                ereport(LOG, (errmsg("the latest WAL insert back off to %X/%X", (uint32)(WriteRqstPtr >> 32),
                                     (uint32)WriteRqstPtr)));
            }

            /*
             * Do a last xlog flush; then, if XLogNeedsFlush() found useful
             * work to do, continue to loop.
             */
            if (XLogNeedsFlush(WriteRqstPtr)) {
                XLogWaitFlush(WriteRqstPtr);
                ereport(LOG,
                        (errmsg("the latest WAL flush to %X/%X.", (uint32)(WriteRqstPtr >> 32), (uint32)WriteRqstPtr)));
            } else {
                XLogRecPtr SendRqstPtr;
                SendRqstPtr = AM_WAL_STANDBY_SENDER ? GetStandbyFlushRecPtr(NULL) : GetFlushRecPtr();
                /* Quick exit if nothing to do */
                if (XLByteLE(SendRqstPtr, t_thrd.walsender_cxt.MyWalSnd->flush) &&
                    !t_thrd.walsender_cxt.wal_send_completed) {
                    t_thrd.walsender_cxt.wal_send_completed = true;
                    ereport(LOG, (errmsg("the latest WAL complete at %X/%X", (uint32)(SendRqstPtr >> 32),
                                         (uint32)SendRqstPtr)));
                } else
                    ereport(LOG, (errmsg("the latest WAL flush at %X/%X the latest standby flush at %X/%X",
                                         (uint32)(SendRqstPtr >> 32), (uint32)SendRqstPtr,
                                         (uint32)(t_thrd.walsender_cxt.MyWalSnd->flush >> 32),
                                         (uint32)t_thrd.walsender_cxt.MyWalSnd->flush)));

                if (!DataSndInProgress(SNDROLE_PRIMARY_STANDBY | SNDROLE_PRIMARY_DUMMYSTANDBY) &&
                    !WalSndInProgress(SNDROLE_PRIMARY_DUMMYSTANDBY | SNDROLE_PRIMARY_STANDBY) &&
                    t_thrd.walsender_cxt.wal_send_completed) {
                    t_thrd.walsender_cxt.response_switchover_requested = false;
                    WalSndResponseSwitchover(t_thrd.walsender_cxt.output_xlog_message);
                    ereport(
                        LOG,
                        (errmsg(
                            "The WAL sender in primary has done the switchover waiting for the standby's promotion.")));
                }
            }
        }
        if (sync_config_needed) {
            if (t_thrd.walsender_cxt.walsender_shutdown_requested) {
                if (!AM_WAL_DB_SENDER && !SendConfigFile(t_thrd.walsender_cxt.gucconf_file))
                    ereport(LOG, (errmsg("failed to send config to the peer when walsender shutdown.")));
                sync_config_needed = false;
            } else {
                TimestampTz nowtime = GetCurrentTimestamp();
                if (TimestampDifferenceExceeds(last_syncconf_timestamp, nowtime, 1000) ||
                    last_syncconf_timestamp > nowtime) {
                    sync_config_needed = false;
                    /* begin send file to standby */
                    if (t_thrd.walsender_cxt.MyWalSnd && t_thrd.walsender_cxt.MyWalSnd->peer_state != BUILDING_STATE) {
                        if (!AM_WAL_DB_SENDER && !SendConfigFile(t_thrd.walsender_cxt.gucconf_file))
                            sync_config_needed = true;
                        else
                            last_syncconf_timestamp = nowtime;
                    } else {
                        sync_config_needed = false;
                        ereport(LOG, (errmsg("receive sigup,but the peer is building!")));
                    }
                }
            }
        }

        if (AmWalSenderToDummyStandby()) {
            /*
             * If i am sender to dummy and streaming to standby is online, do not
             * send WAL to dummy. Especially, set WalSndCaughtUp to true, if the dummy
             * sender is "out of work".
             */
            if (WalSndCaughtup()) {
                t_thrd.walsender_cxt.walSndCaughtUp = true;
                t_thrd.walsender_cxt.sentPtr = InvalidXLogRecPtr;

                /* Close open wal file */
                if (t_thrd.walsender_cxt.sendFile >= 0) {
                    (void)close(t_thrd.walsender_cxt.sendFile);
                    t_thrd.walsender_cxt.sendFile = -1;
                }

                if (u_sess->attr.attr_storage.HaModuleDebug) {
                    ereport(LOG, (errmsg("standby is steaming, "
                                         "stop sync to walsender, recycle local data.")));
                }

                /* Notify dummy to cleanup WAL. False means not need response. */
                if (WalSndDummyLEStandby()) {
                    WalSndRmXLog(false);
                }

                /* Set dummy standby replication slot lsn invalid */
                if (g_instance.attr.attr_storage.max_replication_slots > 0)
                    SetDummyStandbySlotLsnInvalid();
            } else {
                ChooseStartPointForDummyStandby();

                if (!pq_is_send_pending()) {
                    send_data();
                } else {
                    t_thrd.walsender_cxt.walSndCaughtUp = false;
                }

                /* Send DummyStandby end message */
                if (t_thrd.walsender_cxt.walSndCaughtUp) {
                    /* Try to flush pending output to the client */
                    if (pq_flush_if_writable() != 0)
                        break;

                    if (!pq_is_send_pending())
                        WalSndSyncDummyStandbyDone(false);
                }
            }
        } else {
            /*
             * If we don't have any pending data in the output buffer, try to send
             * some more.  If there is some, we don't bother to call XLogSend
             * again until we've flushed it ... but we'd better assume we are not
             * caught up.
             */
            LogCtrlSleep();
            if (!pq_is_send_pending())
                send_data();
            else
                t_thrd.walsender_cxt.walSndCaughtUp = false;

            if (t_thrd.walsender_cxt.walSndCaughtUp && dummyStandbyMode) {
                if (!pq_is_send_pending()) {
                    WalSndSyncDummyStandbyDone(false);
                    (void)pq_flush();
                    ereport(LOG, (errmsg("dummystandby wal data replication completed at %X/%X",
                                         (uint32)(t_thrd.walsender_cxt.sentPtr >> 32),
                                         (uint32)t_thrd.walsender_cxt.sentPtr)));
                }
            }
        }
        LogCtrlSleep();
        /* Try to flush pending output to the client */
        if (pq_flush_if_writable() != 0) {
            ereport(LOG, (errmsg("flush return not zero !\n")));
            break;
        }

        /* If nothing remains to be sent right now ... */
        if (t_thrd.walsender_cxt.walSndCaughtUp && !pq_is_send_pending()) {
            /*
             * If we're in catchup state, move to streaming.  This is an
             * important state change for users to know about, since before
             * this point data loss might occur if the primary dies and we
             * need to failover to the standby. The state change is also
             * important for synchronous replication, since commits that
             * started to wait at that point might wait for some time.
             */
            if (t_thrd.walsender_cxt.MyWalSnd->state == WALSNDSTATE_CATCHUP) {
                ereport(DEBUG1, (errmsg("standby \"%s\" has now caught up with primary",
                                        u_sess->attr.attr_common.application_name)));
                WalSndSetState(WALSNDSTATE_STREAMING);
                /* Refresh new state to peer */
                WalSndKeepalive(true);
            }

            t_thrd.walsender_cxt.catchup_threshold = 0;

            /*
             * When SIGUSR2 arrives, we send any outstanding logs up to the
             * shutdown checkpoint record (i.e., the latest record), wait
             * for them to be replicated to the standby, and exit.
             * This may be a normal termination at shutdown, or a promotion,
             * the walsender is not sure which.
             */
            if (t_thrd.walsender_cxt.walsender_ready_to_stop) {
                ereport(LOG, (errmsg("standby ready_to_stop: walSndCaughtUp:%u, pgpending:%u, sentPtr:%lx, flust:%lx",
                    t_thrd.walsender_cxt.walSndCaughtUp, pq_is_send_pending(),
                    t_thrd.walsender_cxt.sentPtr, t_thrd.walsender_cxt.MyWalSnd->flush)));
                /*
                 * Let's just be real sure we're caught up. For dummy sender,
                 * during shutting down, if the sender to standby is in progress,
                 * skip to send outstanding logs.
                 */
                if (AmWalSenderToDummyStandby() && WalSndInProgress(SNDROLE_PRIMARY_STANDBY))
                    ; /* nothing to do */
                else
                    send_data();

                if (t_thrd.walsender_cxt.walSndCaughtUp && !pq_is_send_pending()) {
                    if (dummyStandbyMode ||
                        XLByteEQ(t_thrd.walsender_cxt.sentPtr, t_thrd.walsender_cxt.MyWalSnd->flush))
                        t_thrd.walsender_cxt.walsender_shutdown_requested = true;
                }
                if (IS_SHARED_STORAGE_MODE || SS_REPLICATION_DORADO_CLUSTER) {
                    t_thrd.walsender_cxt.walsender_shutdown_requested = true;
                }
            }
        } else {
            if (t_thrd.walsender_cxt.MyWalSnd->state == WALSNDSTATE_CATCHUP) {
                CalCatchupRate();
            }
        }

        now = GetCurrentTimestamp();

        if (u_sess->proc_cxt.MyDatabaseId != InvalidOid && t_thrd.slot_cxt.MyReplicationSlot != NULL)
            WalSndWriteLogicalAdvanceXLog(now);

        /*
         * We don't block if not caught up, unless there is unsent data
         * pending in which case we'd better block until the socket is
         * write-ready.  This test is only needed for the case where XLogSend
         * loaded a subset of the available data but then pq_flush_if_writable
         * flushed it all --- we should immediately try to send more.
         */
        if (t_thrd.walsender_cxt.walSndCaughtUp || pq_is_send_pending()) {
            long sleeptime;
            int wakeEvents;
            int half_timeout = WalSndTimeout() / 2;

            wakeEvents = WL_LATCH_SET | WL_POSTMASTER_DEATH | WL_SOCKET_READABLE | WL_TIMEOUT;

            sleeptime = WalSndComputeSleeptime(now);

            if (pq_is_send_pending())
                wakeEvents |= WL_SOCKET_WRITEABLE;
            else if (first_startup) {
                /* Walsender first startup, send a keepalive to standby, no need reply. */
                WalSndKeepalive(false);
                first_startup = false;
            }

            /*
             * if requested to response switchover, walsender need not to wait for new xlog data.
             * if requested to shutdown, walsender need not to wait for new xlog data.
             */
            if (t_thrd.walsender_cxt.response_switchover_requested || t_thrd.walsender_cxt.walsender_shutdown_requested)
                sleeptime = 100; /* 0.1s */

            /* Sleep until something happens or we time out */
            pgstat_report_activity(STATE_IDLE, NULL);
            t_thrd.int_cxt.ImmediateInterruptOK = true;
            CHECK_FOR_INTERRUPTS();

            if (sleeptime > half_timeout)
                sleeptime = half_timeout;

            WaitLatchOrSocket(&t_thrd.walsender_cxt.MyWalSnd->latch, wakeEvents, u_sess->proc_cxt.MyProcPort->sock,
                              sleeptime);
            if (!AM_WAL_STANDBY_SENDER) {
                SyncRepReleaseWaiters();
            }
            t_thrd.int_cxt.ImmediateInterruptOK = false;
        }

        if (!bSyncStat && !dummyStandbyMode) {
            if (XLByteEQ(GetFlushRecPtr(), t_thrd.walsender_cxt.sentPtr) && SyncRepRequested() &&
                most_available_sync == false) {
                bSyncStat = true;
                ereport(LOG, (errmsg("The primary and standby reached syncstat in WalSndLoop.")));
            }
        }

        /* In the streaming dr switchover, and complete the service truncation */
        if (g_instance.streaming_dr_cxt.isInSwitchover &&
            g_instance.streaming_dr_cxt.switchoverBarrierLsn != InvalidXLogRecPtr &&
            t_thrd.walsender_cxt.MyWalSnd->is_cross_cluster &&
            t_thrd.walsender_cxt.MyWalSnd->interactiveState >= SDRS_INTERACTION_BEGIN) {
            WalSndHadrSwitchoverRequest();
        }
        volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
        if (t_thrd.postmaster_cxt.HaShmData->is_hadr_main_standby) {
            /* In distributed streaming dr cluster, shutdown walsender of main standby when term is changed */
            if (IS_MULTI_DISASTER_RECOVER_MODE && walsnd->isTermChanged) {
                ereport(LOG, (errmsg("Shutdown walsender of main standby due to the term change.")));
                SpinLockAcquire(&walsnd->mutex);
                walsnd->isTermChanged = false;
                SpinLockRelease(&walsnd->mutex);
                break;
            }
            /* In streaming dr cluster, send keepalive msg to cascade standby to refresh db state */
            if (walsnd->sendKeepalive) {
                WalSndKeepalive(false);
                SpinLockAcquire(&walsnd->mutex);
                walsnd->sendKeepalive = false;
                SpinLockRelease(&walsnd->mutex);
            }
        }
    }

    t_thrd.utils_cxt.CurrentResourceOwner = tmpOwner;
    WalSndShutdown();
    return 1; /* keep the compiler quiet */
}

/*
 * Work out how many milliseconds a send/receive loop may sleep.
 *
 * When the sender timeout is disabled, or no reply timestamp has been
 * recorded yet, a fixed 1000 ms nap is returned so that the sender does not
 * depend solely on its latch to wake up.
 *
 * Otherwise the result is the time remaining from 'now' until the next
 * deadline measured from the last reply: the full timeout while a ping
 * response is outstanding, or half of it when no ping has been sent yet
 * (that is the moment a keepalive becomes due).
 */
static long WalSndComputeSleeptime(TimestampTz now)
{
    const long defaultNapMs = 1000;
    int senderTimeout = WalSndTimeout();

    if (senderTimeout <= 0 || t_thrd.walsender_cxt.last_reply_timestamp <= 0) {
        return defaultNapMs;
    }

    /* Full timeout once a ping is in flight, otherwise the keepalive point. */
    int waitWindow = t_thrd.walsender_cxt.waiting_for_ping_response ? senderTimeout : senderTimeout / 2;
    TimestampTz deadline = TimestampTzPlusMilliseconds(t_thrd.walsender_cxt.last_reply_timestamp, waitWindow);

    /* Convert the distance between 'now' and the deadline into milliseconds. */
    long remainSecs = 0;
    int remainMicros = 0;
    TimestampDifference(now, deadline, &remainSecs, &remainMicros);

    return remainSecs * 1000 + remainMicros / 1000;
}

/*
 * Write a fresh "logical slot advanced" xlog record once the configured
 * interval has elapsed since the previous one.
 *
 * Nothing happens while no previous write time has been recorded, or while
 * logical_xlog_advanced_timeout (milliseconds) is not positive.
 */
static void WalSndWriteLogicalAdvanceXLog(TimestampTz now)
{
    if (t_thrd.walsender_cxt.last_logical_xlog_advanced_timestamp <= 0) {
        return;
    }
    if (t_thrd.walsender_cxt.logical_xlog_advanced_timeout <= 0) {
        return;
    }

    TimestampTz nextDue = TimestampTzPlusMilliseconds(t_thrd.walsender_cxt.last_logical_xlog_advanced_timestamp,
                                                      t_thrd.walsender_cxt.logical_xlog_advanced_timeout);
    if (now >= nextDue) {
        ereport(LOG, (errmsg("write xlog of logical slot advanced")));
        log_slot_advance(&t_thrd.slot_cxt.MyReplicationSlot->data);
        /* Restart the interval from the time of this write. */
        t_thrd.walsender_cxt.last_logical_xlog_advanced_timestamp = now;
    }
}

/*
 * Return the last reply timestamp recorded for this walsender's channel
 * index (channel_get_replc), as reported by get_last_reply_timestamp().
 */
static TimestampTz GetHeartbeatLastReplyTimestamp()
{
    volatile WalSnd *self = t_thrd.walsender_cxt.MyWalSnd;
    int channelIdx;

    /* Read the channel index under the walsender's spinlock. */
    SpinLockAcquire(&self->mutex);
    channelIdx = self->channel_get_replc;
    SpinLockRelease(&self->mutex);

    return get_last_reply_timestamp(channelIdx);
}

/* Return the point in time at which the sender timeout expires, counted from last_reply_time. */
static inline TimestampTz CalculateTimeout(TimestampTz last_reply_time)
{
    int timeoutMs = WalSndTimeout();
    TimestampTz expiry = TimestampTzPlusMilliseconds(last_reply_time, timeoutMs);

    return expiry;
}

/*
 * Terminate this walsender if nothing has been heard from the standby for
 * longer than the configured sender timeout.
 *
 * The newest known sign of life is cached in last_check_timeout_timestamp.
 * The heartbeat timestamp is consulted only when that cached value already
 * looks expired, so the heartbeat lookup is not performed on every call.
 */
static void WalSndCheckTimeOut(TimestampTz now)
{
    /* Nothing to check when the timeout is off or no reply was ever recorded. */
    if (WalSndTimeout() <= 0) {
        return;
    }
    if (t_thrd.walsender_cxt.last_reply_timestamp <= 0) {
        return;
    }

    /* Fold a newer walsender reply time into the cached value. */
    TimestampTz *newestReply = &t_thrd.walsender_cxt.last_check_timeout_timestamp;
    if (timestamptz_cmp_internal(t_thrd.walsender_cxt.last_reply_timestamp, *newestReply) > 0) {
        *newestReply = t_thrd.walsender_cxt.last_reply_timestamp;
    }

    TimestampTz deadline = CalculateTimeout(*newestReply);
    if (now < deadline) {
        return;
    }

    /* The cached value looks expired: a newer heartbeat may still extend the deadline. */
    TimestampTz heartbeat = GetHeartbeatLastReplyTimestamp();
    if (timestamptz_cmp_internal(heartbeat, *newestReply) > 0) {
        *newestReply = heartbeat;
        deadline = CalculateTimeout(*newestReply);
    }

    if (now >= deadline) {
        /*
         * A replication timeout usually points at a communication problem,
         * so the error is reported with COMMERROR and not sent to the standby.
         */
        WalReplicationTimestampInfo stamps;
        WalReplicationTimestampToString(&stamps, now, deadline, *newestReply, heartbeat);
        const char *timeoutGuc = AM_WAL_DB_SENDER ? "logical_sender_timeout" : "wal_sender_timeout";

        ereport(COMMERROR, (errmsg("terminating Walsender process due to replication timeout."),
                       (errdetail("now time(%s) timeout time(%s) last recv time(%s) heartbeat time(%s)",
                                  stamps.nowTimeStamp, stamps.timeoutStamp,
                                  stamps.lastRecStamp, stamps.heartbeatStamp)),
                       (errhint("try increasing %s or check system time.", timeoutGuc))));
        WalSndShutdown();
    }
}

/*
 * Initialize a per-walsender data structure for this walsender process.
 *
 * Scans WalSndCtl->walsnds (max_wal_senders entries) for an entry whose pid
 * is 0, claims it by storing t_thrd.proc_cxt.MyProcPid, and resets the
 * entry's per-connection fields while holding the entry's spinlock. The
 * claimed entry is then published in t_thrd.walsender_cxt.MyWalSnd and its
 * latch is owned by this thread.
 *
 * Reports FATAL (ERRCODE_TOO_MANY_CONNECTIONS) when every entry is in use.
 * On success, WalSndKill is registered with on_shmem_exit(); it resets the
 * entry again when the walsender exits.
 */
static void InitWalSnd(void)
{
    int i;
    errno_t rc = 0;

    /*
     * WalSndCtl should be set up already (we inherit this by fork() or
     * EXEC_BACKEND mechanism from the postmaster).
     */
    Assert(t_thrd.walsender_cxt.WalSndCtl != NULL);
    Assert(t_thrd.walsender_cxt.MyWalSnd == NULL);

    /*
     * Find a free walsender slot and reserve it. If this fails, we must be
     * out of WalSnd structures.
     */
    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        SpinLockAcquire(&walsnd->mutex);

        /* A non-zero pid marks the entry as taken: unlock and try the next one. */
        if (walsnd->pid != 0) {
            SpinLockRelease(&walsnd->mutex);
            continue;
        } else {
            /*
             * Found a free slot. Reserve it for us.
             */
            walsnd->pid = t_thrd.proc_cxt.MyProcPid;
            rc = memset_s((void *)&walsnd->sentPtr, sizeof(XLogRecPtr), 0, sizeof(XLogRecPtr));
            securec_check(rc, "", "");
            walsnd->state = WALSNDSTATE_STARTUP;
            walsnd->node_state = NODESTATE_NORMAL;
            /* Derive the sender role from the mode flags; the first matching condition wins. */
            if (dummyStandbyMode) {
                walsnd->sendRole = SNDROLE_DUMMYSTANDBY_STANDBY;
            } else if (t_thrd.postmaster_cxt.senderToDummyStandby) {
                walsnd->sendRole = SNDROLE_PRIMARY_DUMMYSTANDBY;
            } else if (t_thrd.postmaster_cxt.senderToBuildStandby) {
                walsnd->sendRole = SNDROLE_PRIMARY_BUILDSTANDBY;
            } else if (AM_WAL_DB_SENDER) {
                walsnd->sendRole = SNDROLE_LOGICAL_SENDER;
            } else {
                walsnd->sendRole = SNDROLE_PRIMARY_STANDBY;
            }

            walsnd->sendKeepalive = false;
            walsnd->replSender = false;
            walsnd->peer_role = UNKNOWN_MODE;
            /*
             * HADR senders are flagged as cross-cluster; their interaction
             * state is reset and the instance-wide streaming DR barrier ids
             * are cleared.
             *
             * NOTE(review): streaming_dr_cxt.mutex is acquired while
             * walsnd->mutex is still held, and targetBarrierId is cleared
             * without that lock whereas currentBarrierId is cleared under
             * it -- confirm both are intentional.
             */
            if (AM_WAL_HADR_SENDER || AM_WAL_HADR_CN_SENDER) {
                walsnd->is_cross_cluster = true;
                walsnd->interactiveState = SDRS_DEFAULT;
                walsnd->isMasterInstanceReady = false;
                walsnd->lastRequestTimestamp = GetCurrentTimestamp();
                rc = memset_s(g_instance.streaming_dr_cxt.targetBarrierId, MAX_BARRIER_ID_LENGTH, 0,
                              sizeof(g_instance.streaming_dr_cxt.targetBarrierId));
                securec_check(rc, "\0", "\0");
                SpinLockAcquire(&g_instance.streaming_dr_cxt.mutex);
                rc = memset_s(g_instance.streaming_dr_cxt.currentBarrierId, MAX_BARRIER_ID_LENGTH, 0,
                              sizeof(g_instance.streaming_dr_cxt.currentBarrierId));
                SpinLockRelease(&g_instance.streaming_dr_cxt.mutex);
                /* The return code is checked only after the inner spinlock has been released. */
                securec_check(rc, "\0", "\0");
            }
            walsnd->isTermChanged = false;
            walsnd->peer_state = NORMAL_STATE;
            walsnd->channel_get_replc = 0;
            /* Zero the reported replication positions and the channel description. */
            rc = memset_s((void *)&walsnd->receive, sizeof(XLogRecPtr), 0, sizeof(XLogRecPtr));
            securec_check(rc, "", "");
            rc = memset_s((void *)&walsnd->write, sizeof(XLogRecPtr), 0, sizeof(XLogRecPtr));
            securec_check(rc, "", "");
            rc = memset_s((void *)&walsnd->flush, sizeof(XLogRecPtr), 0, sizeof(XLogRecPtr));
            securec_check(rc, "", "");
            rc = memset_s((void *)&walsnd->apply, sizeof(XLogRecPtr), 0, sizeof(XLogRecPtr));
            securec_check(rc, "", "");
            rc = memset_s((void *)&walsnd->data_flush, sizeof(XLogRecPtr), 0, sizeof(XLogRecPtr));
            securec_check(rc, "", "");
            rc = memset_s((void *)&walsnd->wal_sender_channel, sizeof(ReplConnInfo), 0, sizeof(ReplConnInfo));
            securec_check(rc, "", "");
            walsnd->sync_standby_group = 0;
            walsnd->sync_standby_priority = 0;
            /* Remember which array position this entry occupies. */
            walsnd->index = i;
            /*
             * Reset the log_ctrl bookkeeping: the RTO/RPO fields start at -1,
             * sleep_count_limit at MAX_CONTROL_REPLY, everything else at 0.
             */
            walsnd->log_ctrl.sleep_time = 0;
            walsnd->log_ctrl.balance_sleep_time = 0;
            walsnd->log_ctrl.prev_RTO = -1;
            walsnd->log_ctrl.current_RTO = -1;
            walsnd->log_ctrl.sleep_count = 0;
            walsnd->log_ctrl.sleep_count_limit = MAX_CONTROL_REPLY;
            walsnd->log_ctrl.prev_flush = 0;
            walsnd->log_ctrl.prev_apply = 0;
            walsnd->log_ctrl.period_total_flush = 0;
            walsnd->log_ctrl.period_total_apply = 0;
            walsnd->log_ctrl.local_prev_flush = 0;
            walsnd->log_ctrl.prev_reply_time = 0;
            walsnd->log_ctrl.prev_calculate_time = 0;
            walsnd->log_ctrl.flush_rate = 0;
            walsnd->log_ctrl.apply_rate = 0;
            walsnd->log_ctrl.local_flush_rate = 0;
            walsnd->log_ctrl.prev_RPO = -1;
            walsnd->log_ctrl.current_RPO = -1;
            walsnd->log_ctrl.prev_send_time = 0;
            /* Start with an empty archive task list. */
            walsnd->archive_task_count = 0;
            walsnd->archive_task_list = NULL;
            walsnd->lastCalTime = 0;
            walsnd->lastCalWrite = InvalidXLogRecPtr;
            walsnd->catchupRate = 0;
            walsnd->slot_idx = -1;
            walsnd->lastReceiveChangeTime = 0;
            walsnd->lastWriteChangeTime = 0;
            walsnd->lastFlushChangeTime = 0;
            walsnd->lastApplyChangeTime = 0;
            SpinLockRelease(&walsnd->mutex);
            /* don't need the lock anymore */
            OwnLatch((Latch *)&walsnd->latch);
            /* Publish the claimed entry; the cast drops the volatile qualifier. */
            t_thrd.walsender_cxt.MyWalSnd = (WalSnd *)walsnd;

            break;
        }
    }
    /* MyWalSnd is still NULL only if the loop found no entry with pid == 0. */
    if (t_thrd.walsender_cxt.MyWalSnd == NULL)
        ereport(FATAL, (errcode(ERRCODE_TOO_MANY_CONNECTIONS), errmsg("number of requested standby connections "
                                                                      "exceeds max_wal_senders (currently %d)",
                                                                      g_instance.attr.attr_storage.max_wal_senders)));

    /* Arrange to clean up at walsender exit */
    on_shmem_exit(WalSndKill, 0);
}

/*
 * Mark a WalSnd entry as no longer in use.
 *
 * Under the entry's spinlock this clears the owner ids (pid, lwpId), the
 * peer/role flags, the channel ports and reply index, and zero-fills both
 * host name buffers of the channel description.
 */
static void WalSndReset(WalSnd *walsnd)
{
    ReplConnInfo *channel = &walsnd->wal_sender_channel;
    errno_t zeroRc = 0;

    SpinLockAcquire(&walsnd->mutex);

    /* Ownership and peer state. */
    walsnd->pid = 0;
    walsnd->lwpId = 0;
    walsnd->peer_role = UNKNOWN_MODE;
    walsnd->replSender = false;

    /* Channel ports and reply index, then the cluster flags. */
    channel->localport = 0;
    channel->remoteport = 0;
    walsnd->channel_get_replc = 0;
    walsnd->is_cross_cluster = false;
    walsnd->isTermChanged = false;

    /* Wipe the local and remote host names. */
    zeroRc = memset_s(channel->localhost, sizeof(channel->localhost), 0, sizeof(channel->localhost));
    securec_check_c(zeroRc, "\0", "\0");
    zeroRc = memset_s(channel->remotehost, sizeof(channel->remotehost), 0, sizeof(channel->remotehost));
    securec_check_c(zeroRc, "\0", "\0");

    SpinLockRelease(&walsnd->mutex);
}

/*
 * Destroy the per-walsender data structure for this walsender process.
 *
 * Installed as an on_shmem_exit() callback by InitWalSnd.
 *
 * code: exit code handed to the callback; a positive value adds a short
 *       sleep so a reported error can reach the client.
 * arg:  not used.
 */
static void WalSndKill(int code, Datum arg)
{
    /* Keep a local pointer: MyWalSnd is cleared below but the entry is still needed. */
    WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    Assert(walsnd != NULL);

    /* Clean the connection for advance logical replication slot. */
    CloseLogicalAdvanceConnect();

    /*
     * Clear MyWalSnd first; then disown the latch.  This is so that signal
     * handlers won't try to touch the latch after it's no longer ours.
     */
    t_thrd.walsender_cxt.MyWalSnd = NULL;

    DisownLatch(&walsnd->latch);

    if (code > 0) {
        /* Sleep at least 0.1 second to wait for reporting the error to the client */
        pg_usleep(100000L);
    }

    /*
     * In dummy standby mode, pass the peer's host name and the remembered
     * remote port to set_failover_host_conninfo_for_dummy(), then forget
     * the port. This must happen before WalSndReset() wipes remotehost.
     */
    if (dummyStandbyMode) {
        set_failover_host_conninfo_for_dummy(walsnd->wal_sender_channel.remotehost, t_thrd.walsender_cxt.remotePort);
        t_thrd.walsender_cxt.remotePort = 0;
    }

    /* reset replication slot status to inactive here. */
    CleanMyReplicationSlot();

    /* Mark WalSnd struct no longer in use. */
    WalSndReset(walsnd);

    /*
     * Here one standby is going down, then check if it was synchronous
     * standby and also there is no more synchronous standby, if yes
     * then wake all waiting transaction and also change the master
     * mode to standalone. Should check lock is held or not already to
     * prevent deadlock. (e.g., fatal occurs when lock held and then
     * re-acquire the same lock when process exits)
     */
    if (LWLockHeldByMe(SyncRepLock)) {
        LWLockRelease(SyncRepLock);
    }
    LWLockAcquire(SyncRepLock, LW_EXCLUSIVE);
    SyncRepCheckSyncStandbyAlive();
    LWLockRelease(SyncRepLock);

    /* Close open wal file */
    if (t_thrd.walsender_cxt.sendFile >= 0) {
        (void)close(t_thrd.walsender_cxt.sendFile);
        t_thrd.walsender_cxt.sendFile = -1;
    }

    /*
     * Try to wake up walsenders which are in WaitLatchOrSocket of WalSndLoop.
     * Or they would be woken up only by walwriter, which may cause that workers
     * are not woken up in time.
     */
    WalSndWakeup();

    /* Invalidate both ends of the recorded "just sent" xlog region. */
    t_thrd.walsender_cxt.wsXLogJustSendRegion->start_ptr = InvalidXLogRecPtr;
    t_thrd.walsender_cxt.wsXLogJustSendRegion->end_ptr = InvalidXLogRecPtr;

    /*
     * Remove the output message buffer from the bbox blacklist when the
     * XLOG_MESSAGE_SEND category is enabled (presumably it was added when
     * the buffer was set up -- not visible here).
     */
    if (BBOX_BLACKLIST_XLOG_MESSAGE_SEND) {
        bbox_blacklist_remove(XLOG_MESSAGE_SEND, t_thrd.walsender_cxt.output_xlog_message);
    }
    /*
     * Reset XlogCopyStartPtr under FullBuildXlogCopyStartPtrLock. The
     * preceding check is made without the lock.
     */
    if (XlogCopyStartPtr != InvalidXLogRecPtr) {
        LWLockAcquire(FullBuildXlogCopyStartPtrLock, LW_EXCLUSIVE);
        XlogCopyStartPtr = InvalidXLogRecPtr;
        LWLockRelease(FullBuildXlogCopyStartPtrLock);
    }

    ereport(LOG, (errmsg("walsender thread shut down")));
}

/*
 * Handle a client's connection abort in an orderly manner.
 *
 * Stops routing messages to the remote peer, writes a shutdown note to the
 * server log and exits the walsender through proc_exit(0). Does not return.
 */
static void WalSndShutdown(void)
{
    /*
     * Reset whereToSendOutput to prevent ereport from attempting to send any
     * more messages to the standby. This has to happen before the log line
     * below is emitted: otherwise that very message could still be routed to
     * the peer over a connection that is being abandoned.
     */
    if (t_thrd.postgres_cxt.whereToSendOutput == DestRemote)
        t_thrd.postgres_cxt.whereToSendOutput = DestNone;

    ereport(LOG, (errmsg("wal send shut down !\n")));

    proc_exit(0);
    abort(); /* keep the compiler quiet */
}

/*
 * Read 'count' bytes from WAL into 'buf', starting at location 'startptr'.
 *
 * XXX probably this should be improved to suck data directly from the
 * WAL buffers when possible. Will open, and keep open, one WAL segment
 * stored in the thread-level file descriptor sendFile. This means if XLogRead
 * is used once, there will always be one descriptor left open until the
 * process ends, but never more than one.
 *
 * Any open/seek/read failure is reported with ereport(ERROR). On seek and
 * read failures the descriptor is closed first; errno of the failing call
 * is preserved across that close() so that %m reports the real cause.
 */
static void XLogRead(char *buf, XLogRecPtr startptr, Size count)
{
    char *p = NULL;
    XLogRecPtr recptr;
    Size nbytes;
    XLogSegNo segno;

retry:
    p = buf;
    recptr = startptr;
    nbytes = count;

    while (nbytes > 0) {
        uint32 startoff;
        int segbytes;
        int readbytes;
        int save_errno = 0;
        bool need_read = true;

        startoff = recptr % XLogSegSize;

        /* Do we need to switch to a different xlog segment? */
        if (t_thrd.walsender_cxt.sendFile < 0 || !XLByteInSeg(recptr, t_thrd.walsender_cxt.sendSegNo)) {
            char path[MAXPGPATH];

            if (t_thrd.walsender_cxt.sendFile >= 0) {
                (void)close(t_thrd.walsender_cxt.sendFile);
            }

            XLByteToSeg(recptr, t_thrd.walsender_cxt.sendSegNo);
            XLogFilePath(path, MAXPGPATH, t_thrd.xlog_cxt.ThisTimeLineID, t_thrd.walsender_cxt.sendSegNo);

            t_thrd.walsender_cxt.sendFile = BasicOpenFile(path, O_RDONLY | PG_BINARY, 0);
            if (t_thrd.walsender_cxt.sendFile < 0) {
                /*
                 * If the file is not found, assume it's because the standby
                 * asked for a too old WAL segment that has already been
                 * removed or recycled.
                 */
                if (FILE_POSSIBLY_DELETED(errno)) {
                    /* we assume a WAL segment removal happened when the xlog file cannot be opened. */
                    WalSegmemtRemovedhappened = true;
                    ereport(ERROR,
                            (errcode_for_file_access(),
                             errmsg("requested WAL segment %s has already been removed",
                                    XLogFileNameP(t_thrd.xlog_cxt.ThisTimeLineID, t_thrd.walsender_cxt.sendSegNo))));
                } else {
                    ereport(ERROR,
                            (errcode_for_file_access(),
                             errmsg("could not open file \"%s\" (log segment %s): %m", path,
                                    XLogFileNameP(t_thrd.xlog_cxt.ThisTimeLineID, t_thrd.walsender_cxt.sendSegNo))));
                }
            }
            t_thrd.walsender_cxt.sendOff = 0;
        }

        /* Need to seek in the file? */
        if (t_thrd.walsender_cxt.sendOff != startoff) {
            if (lseek(t_thrd.walsender_cxt.sendFile, (off_t)startoff, SEEK_SET) < 0) {
                /* close() may overwrite errno; keep the lseek failure reason for %m */
                save_errno = errno;
                (void)close(t_thrd.walsender_cxt.sendFile);
                t_thrd.walsender_cxt.sendFile = -1;
                errno = save_errno;
                ereport(ERROR, (errcode_for_file_access(),
                                errmsg("could not seek in log segment %s to offset %u: %m",
                                       XLogFileNameP(t_thrd.xlog_cxt.ThisTimeLineID, t_thrd.walsender_cxt.sendSegNo),
                                       startoff)));
            }
            t_thrd.walsender_cxt.sendOff = startoff;
        }

        /* How many bytes are within this segment? */
        if (nbytes > (XLogSegSize - startoff)) {
            segbytes = XLogSegSize - startoff;
        } else {
            segbytes = nbytes;
        }

        pgstat_report_waitevent(WAIT_EVENT_WAL_READ);
        /* consider O_DIRECT in dss mode */
        if (is_dss_fd(t_thrd.walsender_cxt.sendFile)) {
            off_t oldStartPos = dss_seek_file(t_thrd.walsender_cxt.sendFile, 0, SEEK_CUR);
            off_t movePos = oldStartPos % ALIGNOF_BUFFER;
            off_t newStartPos = oldStartPos - movePos;
            /* change current access position to newStartPos for O_DIRECT read */
            if (movePos != 0) {
                (void)dss_seek_file(t_thrd.walsender_cxt.sendFile, newStartPos, SEEK_SET);
                char *new_buff = (char*)palloc(movePos + segbytes);
                int new_read = read(t_thrd.walsender_cxt.sendFile, new_buff, movePos + segbytes);
                save_errno = errno;
                /* bytes usable by the caller: everything past the alignment padding */
                readbytes = new_read - (int)movePos;
                /*
                 * Copy only when the read actually delivered payload. A failed
                 * or short read leaves readbytes <= 0; that length must not be
                 * handed to memcpy_s, the failure is reported by the common
                 * "could not read" check below instead.
                 */
                if (readbytes > 0) {
                    errno_t rc = memcpy_s(p, readbytes, new_buff + movePos, readbytes);
                    securec_check(rc, "\0", "\0");
                }
                pfree(new_buff);
                need_read = false;
            }
        }

        if (need_read) {
            readbytes = read(t_thrd.walsender_cxt.sendFile, p, segbytes);
            save_errno = errno;
        }
        pgstat_report_waitevent(WAIT_EVENT_END);
        if (readbytes <= 0) {
            (void)close(t_thrd.walsender_cxt.sendFile);
            t_thrd.walsender_cxt.sendFile = -1;
            /* report the errno seen right after read(), not one left behind by later calls */
            errno = save_errno;
            ereport(ERROR, (errcode_for_file_access(),
                            errmsg("could not read from log segment %s, offset %u, length %lu: %m",
                                   XLogFileNameP(t_thrd.xlog_cxt.ThisTimeLineID, t_thrd.walsender_cxt.sendSegNo),
                                   t_thrd.walsender_cxt.sendOff, INT2ULONG(segbytes))));
        }

        /* Update state for read */
        XLByteAdvance(recptr, readbytes);

        t_thrd.walsender_cxt.sendOff += readbytes;
        nbytes -= readbytes;
        p += readbytes;
    }

    /*
     * After reading into the buffer, check that what we read was valid. We do
     * this after reading, because even though the segment was present when we
     * opened it, it might get recycled or removed while we read it. The
     * read() succeeds in that case, but the data we tried to read might
     * already have been overwritten with new WAL records.
     */
    XLByteToSeg(startptr, segno);
    CheckXLogRemoved(segno, t_thrd.xlog_cxt.ThisTimeLineID);

    /*
     * During recovery, the currently-open WAL file might be replaced with the
     * file of the same name retrieved from archive. So we always need to
     * check what we read was valid after reading into the buffer. If it's
     * invalid, we try to open and read the file again.
     */
    if (AM_WAL_STANDBY_SENDER) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
        bool reload = false;

        /* fetch and clear the reload request in one locked step */
        SpinLockAcquire(&walsnd->mutex);
        reload = walsnd->needreload;
        walsnd->needreload = false;
        SpinLockRelease(&walsnd->mutex);

        if (reload && t_thrd.walsender_cxt.sendFile >= 0) {
            (void)close(t_thrd.walsender_cxt.sendFile);
            t_thrd.walsender_cxt.sendFile = -1;

            goto retry;
        }
    }

    /* the xlog file was opened and read successfully, so clear the removed-segment flag. */
    WalSegmemtRemovedhappened = false;
}

/*
 * Process a logical log entry of type LOGICAL_LOG_COMMIT or LOGICAL_LOG_ABORT.
 *
 * isCommit is true for a commit entry and false for an abort entry. The
 * transaction is either handed to ParallelReorderBufferCommit or dropped
 * with ParallelReorderBufferForget; logChange is passed to FreeLogicalLog
 * on every path.
 */
static void LogicalLogHandleAbortOrCommit(ParallelReorderBuffer *prb, logicalLog *logChange, int slotId, bool isCommit)
{
    ParallelReorderBufferTXN *topTxn =
        ParallelReorderBufferTXNByXid(prb, logChange->xid, true, NULL, logChange->lsn, true);

    if (topTxn == NULL) {
        ereport(LOG, (errmodule(MOD_LOGICAL_DECODE), errcode(ERRCODE_LOGICAL_DECODE_ERROR),
            errmsg("Logical log commit with no txn found")));
        FreeLogicalLog(prb, logChange, slotId, false);
        return;
    }

    /* Copy the final state carried by the log entry onto the top-level txn. */
    topTxn->final_lsn = logChange->finalLsn;
    topTxn->nsubtxns = logChange->nsubxacts;
    topTxn->commit_time = logChange->commitTime;
    topTxn->origin_id = logChange->origin_id;

    /*
     * The transaction is discarded when it ends before the dispatcher's start
     * point, when its entry precedes the first confirmed flush position, or
     * when it is an abort.
     */
    const bool discardTxn = XLByteLT(topTxn->final_lsn, g_Logicaldispatcher[slotId].startpoint) ||
        XLByteLT(logChange->lsn, t_thrd.walsender_cxt.firstConfirmedFlush) || !isCommit;

    /* Stamp every known subtransaction and attach it to the top-level txn. */
    for (int idx = 0; idx < logChange->nsubxacts; idx++) {
        ParallelReorderBufferTXN *child =
            ParallelReorderBufferTXNByXid(prb, logChange->subXids[idx], false, NULL, InvalidXLogRecPtr, false);

        if (child != NULL) {
            child->final_lsn = logChange->finalLsn;
            child->commit_time = logChange->commitTime;

            if (!child->is_known_as_subxact) {
                dlist_delete(&child->node);
                child->is_known_as_subxact = true;
                dlist_push_tail(&topTxn->subtxns, &child->node);
            }
        }
    }

    if (!discardTxn) {
        ParallelReorderBufferCommit(prb, logChange, slotId, topTxn);
    } else {
        ParallelReorderBufferForget(prb, slotId, topTxn);
    }
    FreeLogicalLog(prb, logChange, slotId, false);
}

/*
 * Dispatch one logical log entry taken from a decoder thread's queue.
 *
 * prb is the parallel reorder buffer the entry is applied to, logChange the
 * entry itself. Depending on logChange->type the entry is queued into the
 * reorder buffer, used to advance restart/xmin bookkeeping on the reader
 * worker, treated as a commit/abort, or used to set the sent position.
 * Entries of an unrecognized type are ignored.
 */
void LogicalLogHandle(ParallelReorderBuffer *prb, logicalLog *logChange)
{
    int slotId = t_thrd.walsender_cxt.LogicalSlot;
    ParallelDecodeReaderWorker* readWorker = g_Logicaldispatcher[slotId].readWorker;

    switch (logChange->type) {
        case LOGICAL_LOG_EMPTY: {
            FreeLogicalLog(prb, logChange, slotId, false);
            break;
        }
        /* These entry types are all just queued into the reorder buffer. */
        case LOGICAL_LOG_DML:
        case LOGICAL_LOG_NEW_CID:
        case LOGICAL_LOG_MISSING_CHUNK: {
            ParallelReorderBufferQueueChange(prb, logChange, slotId);
            break;
        }
        case LOGICAL_LOG_RUNNING_XACTS: {
            ParallelReorderBufferTXN *oldestTxn = ParallelReorderBufferGetOldestTXN(prb);
            /*
             * oldest ongoing txn might have started when we didn't yet serialize
             * anything because we hadn't reached a consistent state yet.
             */
            prb->lastRunningXactOldestXmin = logChange->oldestXmin;
            SpinLockAcquire(&(readWorker->rwlock));
            readWorker->current_lsn = logChange->lsn;
            prb->current_restart_decoding_lsn = logChange->lsn;

            /*
             * Every time the running Xact log is decoded,
             * the LSN and xmin in the decoding log are recorded and
             * pre pushed in the parallel logical reader thread.
             */
            if (oldestTxn == NULL) {
                readWorker->restart_lsn = logChange->lsn;
                readWorker->candidate_oldest_xmin = logChange->oldestXmin;
            } else {
                readWorker->restart_lsn = oldestTxn->restart_decoding_lsn;
                readWorker->candidate_oldest_xmin = oldestTxn->oldestXid;
            }
            readWorker->candidate_oldest_xmin_lsn = logChange->lsn;

            /*
             * Capture the values to be logged while the lock is held, but do
             * the logging itself only after the spinlock is released: ereport
             * is far too heavy to run inside a spinlock-protected section.
             */
            const uint32 restartHi = (uint32)(readWorker->restart_lsn >> 32);
            const uint32 restartLo = (uint32)readWorker->restart_lsn;
            const uint32 currentHi = (uint32)(readWorker->current_lsn >> 32);
            const uint32 currentLo = (uint32)readWorker->current_lsn;
            SpinLockRelease(&(readWorker->rwlock));

            ereport(DEBUG2, (errmodule(MOD_LOGICAL_DECODE), errcode(ERRCODE_LOGICAL_DECODE_ERROR),
                errmsg("LogicalLogHandle restart_lsn at %X/%X, current_lsn %X/%X.",
                    restartHi, restartLo, currentHi, currentLo)));
            /*
             * Iterate through all (potential) toplevel TXNs and abort all that are
             * older than what possibly can be running.
             */
            while (true) {
                ParallelReorderBufferTXN *staleTxn = ParallelReorderBufferGetOldestTXN(prb);
                if (staleTxn != NULL && staleTxn->xid < logChange->oldestXmin) {
                    ereport(DEBUG2,
                        (errmodule(MOD_LOGICAL_DECODE), errmsg("aborting old transaction %lu", staleTxn->xid)));

                    /* remove potential on-disk data, and deallocate this tx */
                    ParallelReorderBufferForget(prb, slotId, staleTxn);
                } else {
                    break;
                }
            }
            FreeLogicalLog(prb, logChange, slotId, false);
            break;
        }
        case LOGICAL_LOG_COMMIT: {
            LogicalLogHandleAbortOrCommit(prb, logChange, slotId, true);
            break;
        }

        case LOGICAL_LOG_ABORT: {
            LogicalLogHandleAbortOrCommit(prb, logChange, slotId, false);
            break;
        }
        case LOGICAL_LOG_CONFIRM_FLUSH: {
            /* Both the sent position and the first confirmed flush position start at this LSN. */
            t_thrd.walsender_cxt.sentPtr = logChange->lsn;
            t_thrd.walsender_cxt.firstConfirmedFlush = logChange->lsn;
            ereport(LOG, (errmodule(MOD_LOGICAL_DECODE), errcode(ERRCODE_UNRECOGNIZED_NODE_TYPE),
                errmsg("t_thrd.walsender_cxt.sentPtr %lu", t_thrd.walsender_cxt.sentPtr)));
            break;
        }
        case LOGICAL_LOG_ASSIGNMENT: {
            ParallelReorderBufferChildAssignment(prb, logChange);
            FreeLogicalLog(prb, logChange, slotId, false);
            break;
        }
        default:
            break;
    }
}

/*
 * Get the logical logs in logical queue in turn, and send them after processing.
 */
void XLogSendParallelLogical()
{
    int slotId = t_thrd.walsender_cxt.LogicalSlot;

    if (t_thrd.slot_cxt.MyReplicationSlot == NULL && g_Logicaldispatcher[slotId].MyReplicationSlot != NULL) {
        t_thrd.slot_cxt.MyReplicationSlot = g_Logicaldispatcher[slotId].MyReplicationSlot;
    }

    /*
     * Initialize when entering the loop for the first time.
     * Ensure to get the correct logical log in logical queue every time.
     */
    if (g_Logicaldispatcher[slotId].firstLoop) {
        g_Logicaldispatcher[slotId].id = 0;
        g_Logicaldispatcher[slotId].firstLoop = false;
    }
    ParallelReorderBuffer *prb = t_thrd.walsender_cxt.parallel_logical_decoding_ctx->reorder;

    /* After 1 second with no new transactions, all decoded results should be sent automatically. */
    {
        const int expTime = 1000;
        ParallelLogicalDecodingContext *ctx = (ParallelLogicalDecodingContext *)prb->private_data;
        if (TimestampDifferenceExceeds(g_Logicaldispatcher[slotId].decodeTime, GetCurrentTimestamp(), expTime) &&
            g_Logicaldispatcher[slotId].remainPatch) {
            if (g_Logicaldispatcher[slotId].pOptions.decode_style == 'b' ||
                g_Logicaldispatcher[slotId].pOptions.sending_batch > 0) {
                pq_sendint32(ctx->out, 0); /* We send a zero to display that no other decoding result is followed */
            }
            WalSndWriteDataHelper(ctx->out, 0, 0, false);
            g_Logicaldispatcher[slotId].remainPatch = false;
            t_thrd.walsender_cxt.sentPtr = pg_atomic_read_u64(&g_Logicaldispatcher[slotId].sentPtr);
            WalSndKeepalive(false);
            g_Logicaldispatcher[slotId].decodeTime = GetCurrentTimestamp();
        } else if (TimestampDifferenceExceeds(g_Logicaldispatcher[slotId].decodeTime, GetCurrentTimestamp(), expTime)) {
            t_thrd.walsender_cxt.sentPtr = pg_atomic_read_u64(&g_Logicaldispatcher[slotId].sentPtr);
            WalSndKeepalive(false);
            g_Logicaldispatcher[slotId].decodeTime = GetCurrentTimestamp();
        }
    }

    /*
     * Poll from all decoder threads to get logical logs.
     * Since the reader polls the logs sent to the decode thread,
     * the logical logs obtained by polling are in order.
     */
    for (;; g_Logicaldispatcher[slotId].id = (g_Logicaldispatcher[slotId].id + 1) % GetDecodeParallelism(slotId)) {

        if (g_Logicaldispatcher[slotId].abnormal) {
            /*
             * Exit the current thread. When a thread in the thread group exits abnormally
             */
            knl_g_parallel_decode_context *pDecodeCxt = &g_instance.comm_cxt.pdecode_cxt[slotId];
            if (pDecodeCxt->edata != NULL) {
                ReThrowError(pDecodeCxt->edata);
            } else {
                ereport(ERROR, (errmodule(MOD_LOGICAL_DECODE),
                    errmsg("walsender send SIGTERM to all parallel logical threads.")));
            }
        }

        ParallelDecodeWorker* decodeWorker = g_Logicaldispatcher[slotId].decodeWorkers[g_Logicaldispatcher[slotId].id];
        logicalLog *logChange = (logicalLog*)LogicalQueueTop(decodeWorker->LogicalLogQueue);

        if (logChange != NULL) {
            LogicalLogHandle(prb, logChange);
            LogicalQueuePop(decodeWorker->LogicalLogQueue);
        } else {
            volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
            SpinLockAcquire(&walsnd->mutex);
            walsnd->sentPtr = t_thrd.walsender_cxt.sentPtr;
            SpinLockRelease(&walsnd->mutex);
            return;
        }
    }
}

/*
 * Read one WAL record through the logical decoding reader, decode it, and
 * publish the resulting sent position in shared memory.
 */
static void XLogSendLogical(void)
{
    char *errm = NULL;

    /*
     * Whether we have caught up is not known yet. WalSndWaitForWal sets the
     * flag when it really waits; it is also set below when XLogReadRecord()
     * stopped reading without WalSndWaitForWal having waited, i.e. during
     * shutdown.
     */
    t_thrd.walsender_cxt.walSndCaughtUp = false;

    XLogRecord *record = XLogReadRecord(t_thrd.walsender_cxt.logical_decoding_ctx->reader,
                                        t_thrd.walsender_cxt.logical_startptr, &errm);
    t_thrd.walsender_cxt.logical_startptr = InvalidXLogRecPtr;

    /* xlog record was invalid */
    if (errm != NULL) {
        ereport(ERROR, (errcode(ERRCODE_LOGICAL_DECODE_ERROR),
                        errmsg("Stopped to parse any valid XLog Record at %X/%X: %s.",
                               (uint32)(t_thrd.walsender_cxt.logical_decoding_ctx->reader->EndRecPtr >> 32),
                               (uint32)t_thrd.walsender_cxt.logical_decoding_ctx->reader->EndRecPtr, errm)));
    }

    if (record == NULL) {
        /*
         * No record was returned. If the reader already stands at or beyond
         * the flushed point, we have caught up.
         */
        if (t_thrd.walsender_cxt.logical_decoding_ctx->reader->EndRecPtr >= GetFlushRecPtr()) {
            t_thrd.walsender_cxt.walSndCaughtUp = true;
        }
    } else {
        LogicalDecodingProcessRecord(t_thrd.walsender_cxt.logical_decoding_ctx,
                                     t_thrd.walsender_cxt.logical_decoding_ctx->reader);

        t_thrd.walsender_cxt.sentPtr = t_thrd.walsender_cxt.logical_decoding_ctx->reader->EndRecPtr;
    }

    /* Update shared memory status; volatile pointer prevents code rearrangement */
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    SpinLockAcquire(&walsnd->mutex);
    walsnd->sentPtr = t_thrd.walsender_cxt.sentPtr;
    SpinLockRelease(&walsnd->mutex);
}

/*
 * Read up to MaxSendSize kB of WAL that is eligible for sending but has not
 * been sent yet, and queue it as one message in the libpq output buffer.
 *
 * t_thrd.walsender_cxt.walSndCaughtUp is set to true when nothing remains
 * to be sent up to the request pointer, otherwise it is set to false.
 * t_thrd.walsender_cxt.sentPtr and the shared WalSnd entry are advanced to
 * the end of the slice that was queued.
 */
static void XLogSendPhysical(void)
{
    XLogRecPtr SendRqstPtr = InvalidXLogRecPtr;
    XLogRecPtr startptr = InvalidXLogRecPtr;
    XLogRecPtr endptr = InvalidXLogRecPtr;
    XLogRecPtr receivePtr;
    XLogRecPtr writePtr;
    XLogRecPtr flushPtr;
    XLogRecPtr replayPtr;
    bool amSync = false;
    Size nbytes = 0;
    WalDataMessageHeader msghdr;
    ServerMode local_role;
    bool got_recptr = false;
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    errno_t errorno = EOK;

    t_thrd.walsender_cxt.catchup_threshold = 0;

    /*
     * Attempt to send all data that's already been written out and fsync'd to
     * disk.  We cannot go further than what's been written out given the
     * current implementation of XLogRead().  And in any case it's unsafe to
     * send WAL that is not securely down to disk on the master: if the master
     * subsequently crashes and restarts, slaves must not have applied any WAL
     * that gets lost on the master.
     *
     * Which pointer bounds the send depends on the kind of sender, see the
     * individual branches below.
     */
    if (AM_WAL_STANDBY_SENDER) {
        TimeLineID currentTargetTLI;
        SendRqstPtr = GetStandbyFlushRecPtr(&currentTargetTLI);

        /*
         * If the recovery target timeline changed, bail out. It's a bit
         * unfortunate that we have to just disconnect, but there is no way
         * to tell the client that the timeline changed. We also don't know
         * exactly where the switch happened, so we cannot safely try to send
         * up to the switchover point before disconnecting.
         */
        if (currentTargetTLI != t_thrd.xlog_cxt.ThisTimeLineID) {
            /* log only once: the flag stays set afterwards */
            if (!t_thrd.walsender_cxt.walsender_ready_to_stop)
                ereport(LOG, (errmsg("terminating walsender process to force cascaded standby "
                                     "to update timeline and reconnect")));
            t_thrd.walsender_cxt.walsender_ready_to_stop = true;
            t_thrd.walsender_cxt.walSndCaughtUp = true;
            return;
        }
    } else if (dummyStandbyMode) {
        SendRqstPtr = GetWalRcvWriteRecPtr(NULL);
    } else if (USE_SYNC_REP_FLUSH_PTR && !t_thrd.postmaster_cxt.senderToBuildStandby) {
        /* bound the send by the flush position reported by SyncRepGetSyncRecPtr */
        got_recptr = SyncRepGetSyncRecPtr(&receivePtr, &writePtr, &flushPtr, &replayPtr, &amSync, false);
        if (!got_recptr) {
            ereport(ERROR,
                (errmsg("WAL sender for HADR could not find an appropriated location with SyncRepGetSyncRecPtr.")));
        }
        SendRqstPtr = flushPtr;
    } else {
        SendRqstPtr = GetFlushRecPtr();
    }

    /* Quick exit if nothing to do */
    if (!u_sess->attr.attr_storage.enable_stream_replication || XLByteLE(SendRqstPtr, t_thrd.walsender_cxt.sentPtr)) {
        t_thrd.walsender_cxt.walSndCaughtUp = true;
        return;
    }

    /*
     * Figure out how much to send in one message. If there's no more than
     * MaxSendSize kB to send, send everything. Otherwise send
     * MaxSendSize kB, but round back to logfile or page boundary.
     *
     * The rounding is not only for performance reasons. Walreceiver relies on
     * the fact that we never split a WAL record across two messages. Since a
     * long WAL record is split at page boundary into continuation records,
     * page boundary is always a safe cut-off point. We also assume that
     * SendRqstPtr never points to the middle of a WAL record.
     */
    startptr = t_thrd.walsender_cxt.sentPtr;
    endptr = startptr;
    XLByteAdvance(endptr, g_instance.attr.attr_storage.MaxSendSize * 1024);

    /* if we went beyond SendRqstPtr, back off */
    if (XLByteLE(SendRqstPtr, endptr)) {
        endptr = SendRqstPtr;
        t_thrd.walsender_cxt.walSndCaughtUp = true;
    } else {
        /* round down to page boundary. */
        endptr -= (endptr % XLOG_BLCKSZ);
        t_thrd.walsender_cxt.walSndCaughtUp = false;
        /* remember how far behind the request pointer this slice still ends */
        t_thrd.walsender_cxt.catchup_threshold = XLByteDifference(SendRqstPtr, endptr);
    }

    nbytes = endptr - startptr;
    Assert(nbytes <= (Size)g_instance.attr.attr_storage.MaxSendSize * 1024);

    /* an empty slice is only reported; the (empty) message is still built and queued below */
    if (nbytes == 0)
        ereport(NOTICE, (errmsg("streaming body is empty, "
                                "request send: %X/%X, already sent: %X/%X",
                                (uint32)(SendRqstPtr >> 32), (uint32)SendRqstPtr,
                                (uint32)(t_thrd.walsender_cxt.sentPtr >> 32), (uint32)t_thrd.walsender_cxt.sentPtr)));

    /*
     * OK to read and send the slice. The first byte of the message marks the
     * payload kind: 'w' for plain WAL data, 'C' for compressed WAL data.
     */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'w';

    /*
     * Without compression the log is read directly into the output buffer to
     * avoid extra memcpy calls.
     */

    /* with compression: read into temp buffer, compress, then copy to output buffer */
    int compressedSize = 0;

    if (AmWalSenderToStandby() && g_instance.attr.attr_storage.enable_wal_shipping_compression &&
        AM_WAL_HADR_DNCN_SENDER) {
        t_thrd.walsender_cxt.output_xlog_message[0] = 'C';
        /* XLogCompression resets the marker to 'w' itself when it falls back to plain data */
        XLogCompression(&compressedSize, startptr, nbytes);
    } else {
        XLogRead(t_thrd.walsender_cxt.output_xlog_message + 1 + sizeof(WalDataMessageHeader), startptr, nbytes);
        ereport(DEBUG5, (errmsg("conninfo:(%s,%d) start: %X/%X, end: %X/%X, %lu bytes",
                                t_thrd.walsender_cxt.MyWalSnd->wal_sender_channel.localhost,
                                t_thrd.walsender_cxt.MyWalSnd->wal_sender_channel.localport, (uint32)(startptr >> 32),
                                (uint32)startptr, (uint32)(endptr >> 32), (uint32)endptr, nbytes)));
    }

    /*
     * We fill the message header last so that the send timestamp is taken as
     * late as possible.
     */
    msghdr.dataStart = startptr;
    msghdr.walEnd = SendRqstPtr;
    msghdr.sendTime = GetCurrentTimestamp();
    msghdr.sender_sent_location = endptr;
    msghdr.catchup = (t_thrd.walsender_cxt.MyWalSnd->state == WALSNDSTATE_CATCHUP &&
        !t_thrd.walsender_cxt.walSndCaughtUp);
    /* read the current HA mode under its spinlock */
    SpinLockAcquire(&hashmdata->mutex);
    local_role = hashmdata->current_mode;
    SpinLockRelease(&hashmdata->mutex);
    if (local_role == PRIMARY_MODE) {
        /* Local role is a primary */
        msghdr.sender_flush_location = GetFlushRecPtr();
        msghdr.sender_replay_location = msghdr.sender_flush_location;
        msghdr.sender_write_location = GetXLogWriteRecPtr();
    } else {
        /* Local role is not a primary */
        msghdr.sender_write_location = GetWalRcvWriteRecPtr(NULL);
        msghdr.sender_flush_location = GetStandbyFlushRecPtr(NULL);
        msghdr.sender_replay_location = GetXLogReplayRecPtr(NULL);
    }

    /* place the header right behind the one-byte message kind marker */
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1,
                       sizeof(WalDataMessageHeader) + g_instance.attr.attr_storage.MaxSendSize * 1024, &msghdr,
                       sizeof(WalDataMessageHeader));
    securec_check(errorno, "\0", "\0");
    LogCtrlSleep();

    /* payload length is the compressed size for 'C' messages, the raw size otherwise */
    if (t_thrd.walsender_cxt.output_xlog_message[0] == 'C') {
        (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message,
                                    1 + sizeof(WalDataMessageHeader) + compressedSize);
    } else {
        (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message,
                                    1 + sizeof(WalDataMessageHeader) + nbytes);
    }

    t_thrd.walsender_cxt.sentPtr = endptr;

    /* Update shared memory status */
    {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
        walsnd->log_ctrl.prev_send_time = GetCurrentTimestamp();
        SpinLockAcquire(&walsnd->mutex);
        walsnd->sentPtr = t_thrd.walsender_cxt.sentPtr;
        SpinLockRelease(&walsnd->mutex);
    }

    /* Report progress of XLOG streaming in PS display */
    if (u_sess->attr.attr_common.update_process_title) {
        char activitymsg[50];
        int rc = 0;

        rc = snprintf_s(activitymsg, sizeof(activitymsg), sizeof(activitymsg) - 1, "streaming %X/%X",
                        (uint32)(t_thrd.walsender_cxt.sentPtr >> 32), (uint32)t_thrd.walsender_cxt.sentPtr);
        securec_check_ss(rc, "\0", "\0");

        set_ps_display(activitymsg, false);
    }

    return;
}

void XLogCompression(int* compressedSize, XLogRecPtr startPtr, Size nbytes)
{
    /* for xlog shipping performances */
    char *xlogReadBuf = t_thrd.walsender_cxt.xlogReadBuf;
    char *compressedBuf = t_thrd.walsender_cxt.compressBuf;
    errno_t errorno = EOK;

    if (xlogReadBuf == NULL) {
        t_thrd.walsender_cxt.xlogReadBuf = (char *)palloc(1 + sizeof(WalDataMessageHeader) +
            (int)WS_MAX_SEND_SIZE);
        xlogReadBuf = t_thrd.walsender_cxt.xlogReadBuf;
    }
    if (compressedBuf == NULL) {
        t_thrd.walsender_cxt.compressBuf = (char *)palloc(1 + sizeof(WalDataMessageHeader) +
            (int)WS_MAX_SEND_SIZE);
        compressedBuf = t_thrd.walsender_cxt.compressBuf;
    }

    XLogRead(xlogReadBuf, startPtr, nbytes);
    *compressedSize = LZ4_compress_default(xlogReadBuf, compressedBuf, nbytes, LZ4_compressBound(nbytes));
    if (*compressedSize > g_instance.attr.attr_storage.MaxSendSize * 1024) {
        ereport(WARNING, (errmsg("[CompressWarning] compressed size big than MaxSendSize! startPtr %X/%X, "
                                 "originsize %ld, compressedSize %d, compressBound %d",
                                 (uint32)(startPtr >> 32), (uint32)startPtr, nbytes, *compressedSize,
                                 LZ4_compressBound(nbytes))));
        t_thrd.walsender_cxt.output_xlog_message[0] = 'w';
        errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1 + sizeof(WalDataMessageHeader),
            nbytes, xlogReadBuf, nbytes);
        securec_check(errorno, "\0", "\0");
        return;
    }
    if (*compressedSize <= 0) {
        ereport(WARNING, (errmsg("[CompressFailed] startPtr %X/%X, originsize %ld, compressedSize %d, compressBound %d",
                                 (uint32)(startPtr >> 32), (uint32)startPtr, nbytes, *compressedSize,
                                 LZ4_compressBound(nbytes))));
        t_thrd.walsender_cxt.output_xlog_message[0] = 'w';
        errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1 + sizeof(WalDataMessageHeader),
            nbytes, xlogReadBuf, nbytes);
        securec_check(errorno, "\0", "\0");
        return;
    }
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1 + sizeof(WalDataMessageHeader),
        *compressedSize, compressedBuf, *compressedSize);
    securec_check(errorno, "\0", "\0");
    ereport(DEBUG4, ((errmodule(MOD_REDO), errcode(ERRCODE_LOG),
        errmsg("[XLOG_COMPRESS] xlog compression working! startPtr %X/%X, origSize %ld, compressedSize %d",
        (uint32)(startPtr >> 32), (uint32)startPtr, nbytes, *compressedSize))));

}

/*
 * Request walsenders to reload the currently-open WAL file
 */
void WalSndRqstFileReload(void)
{
    int i;

    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        if (walsnd->pid == 0)
            continue;

        SpinLockAcquire(&walsnd->mutex);
        walsnd->needreload = true;
        SpinLockRelease(&walsnd->mutex);
    }
}

/*
 * SIGHUP: set flag to re-read config file at next convenient time.
 *
 * A database walsender that has a logical slot assigned additionally
 * forwards SIGHUP to its parallel-decoding reader and decoder threads that
 * are in the running state.
 */
static void WalSndSigHupHandler(SIGNAL_ARGS)
{
    const int savedErrno = errno;

    t_thrd.walsender_cxt.got_SIGHUP = true;
    if (t_thrd.walsender_cxt.MyWalSnd) {
        SetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
    }

    /* nothing to forward unless this is a logical sender with a slot */
    if (!(AM_WAL_DB_SENDER) || t_thrd.walsender_cxt.LogicalSlot == -1) {
        errno = savedErrno;
        return;
    }

    int slotId = t_thrd.walsender_cxt.LogicalSlot;
    int workerCount = g_Logicaldispatcher[slotId].pOptions.parallel_decode_num;
    knl_g_parallel_decode_context *decodeCxt = g_instance.comm_cxt.pdecode_cxt;

    /* reader thread */
    if (decodeCxt[slotId].ParallelReaderWorkerStatus.threadState == PARALLEL_DECODE_WORKER_RUN &&
        g_Logicaldispatcher[slotId].readWorker != NULL && g_Logicaldispatcher[slotId].readWorker->tid != 0) {
        signal_child(g_Logicaldispatcher[slotId].readWorker->tid, SIGHUP, -1);
    }

    /* decoder threads */
    for (int w = 0; w < workerCount; w++) {
        if (decodeCxt[slotId].ParallelDecodeWorkerStatusList[w].threadState == PARALLEL_DECODE_WORKER_RUN &&
            g_Logicaldispatcher[slotId].decodeWorkers != NULL &&
            g_Logicaldispatcher[slotId].decodeWorkers[w] != NULL &&
            g_Logicaldispatcher[slotId].decodeWorkers[w]->tid.thid != 0) {
            signal_child(g_Logicaldispatcher[slotId].decodeWorkers[w]->tid.thid, SIGHUP, -1);
        }
    }

    errno = savedErrno;
}

/*
 * SIGTERM: set flag to shut down.
 *
 * errno is saved on entry and restored on exit so the interrupted code does
 * not see it change.
 */
static void WalSndShutdownHandler(SIGNAL_ARGS)
{
    const int savedErrno = errno;

    t_thrd.walsender_cxt.walsender_shutdown_requested = true;
    if (t_thrd.walsender_cxt.MyWalSnd) {
        SetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
    }

    /*
     * Raise the regular (non-walsender) interrupt state too, which lets
     * things like do_pg_stop_backup() be aborted.
     */
    InterruptPending = true;
    t_thrd.int_cxt.ProcDiePending = true;

    errno = savedErrno;
}

/*
 * WalSndQuickDieHandler() runs when the postmaster signals SIGQUIT.
 *
 * Some other backend has crashed, so we must stop what we are doing and
 * exit immediately, without any cleanup.
 */
static void WalSndQuickDieHandler(SIGNAL_ARGS)
{
    /* Install the BlockSig mask first (presumably so no other signal interrupts the exit path). */
    gs_signal_setmask(&t_thrd.libpq_cxt.BlockSig, NULL);

    /*
     * We DO NOT want to run proc_exit() callbacks -- we're here because
     * shared memory may be corrupted, so we don't want to try to clean up our
     * transaction.  Just get out as fast as possible.  Because there is an
     * atexit callback that guards against third-party code calling exit()
     * directly, the callbacks have to be reset explicitly for this to work
     * as intended.
     */
    on_exit_reset();

    /*
     * Note we do exit(2) not exit(0).  This is to force the postmaster into a
     * system reset cycle if someone sends a manual SIGQUIT to a random
     * backend.  This is necessary precisely because we don't clean up our
     * shared memory state.  (The "dead man switch" mechanism in pmsignal.c
     * should ensure the postmaster sees this as a crash, too, but no harm in
     * being doubly sure.)
     */
    exit(2);
}

/*
 * SIGUSR1: delegate to the latch machinery's SIGUSR1 handler, which is what
 * wakes the walsender to send WAL.  errno is preserved across the call.
 */
static void WalSndXLogSendHandler(SIGNAL_ARGS)
{
    int saved_errno = errno;

    latch_sigusr1_handler();

    errno = saved_errno;
}

/*
 * SIGUSR2: request one last send cycle followed by shutdown, and wake the
 * walsender.
 *
 * A switchover response is additionally requested when this walsender's
 * node_state calls for it:
 *   - dummy-standby deployments: the walsender must not be the one serving
 *     the dummy standby, and node_state must be PROMOTE_APPROVE or
 *     STANDBY_REDIRECT;
 *   - otherwise: node_state must be PROMOTE_APPROVE.
 * errno is preserved.
 */
static void WalSndLastCycleHandler(SIGNAL_ARGS)
{
    int saved_errno = errno;
    bool wantSwitchover = false;

    t_thrd.walsender_cxt.walsender_ready_to_stop = true;
    if (t_thrd.walsender_cxt.MyWalSnd) {
        SetLatch(&t_thrd.walsender_cxt.MyWalSnd->latch);
    }

    if (IS_DN_DUMMY_STANDYS_MODE()) {
        if (t_thrd.walsender_cxt.MyWalSnd && !AmWalSenderToDummyStandby()) {
            wantSwitchover = (t_thrd.walsender_cxt.MyWalSnd->node_state == NODESTATE_PROMOTE_APPROVE ||
                              t_thrd.walsender_cxt.MyWalSnd->node_state == NODESTATE_STANDBY_REDIRECT);
        }
    } else if (t_thrd.walsender_cxt.MyWalSnd) {
        wantSwitchover = (t_thrd.walsender_cxt.MyWalSnd->node_state == NODESTATE_PROMOTE_APPROVE);
    }

    if (wantSwitchover) {
        t_thrd.walsender_cxt.response_switchover_requested = true;
    }

    errno = saved_errno;
}

/*
 * SIGCHLD: record that a parallel-decode child thread has exited.
 *
 * Only meaningful for a logical (DB) walsender bound to a slot; otherwise the
 * handler does nothing.  The exiting thread (CurExitThread) is looked up in
 * the slot's decoder status list and compared with the reader status; each
 * match is switched to PARALLEL_DECODE_WORKER_EXIT.  The slot's dispatcher is
 * flagged abnormal regardless of whether a match was found.
 */
static void WalSndSigChldHandler(SIGNAL_ARGS)
{
    if (!(t_thrd.role == WAL_DB_SENDER && t_thrd.walsender_cxt.LogicalSlot != -1)) {
        return;
    }

    int slot = t_thrd.walsender_cxt.LogicalSlot;
    knl_g_parallel_decode_context *decodeCxt = g_instance.comm_cxt.pdecode_cxt;
    ThreadId exitedTid = gs_thread_id(t_thrd.postmaster_cxt.CurExitThread);

    /* at most one decoder entry is updated */
    for (int w = 0; w < decodeCxt[slot].totalNum; w++) {
        if (decodeCxt[slot].ParallelDecodeWorkerStatusList[w].threadId == exitedTid) {
            decodeCxt[slot].ParallelDecodeWorkerStatusList[w].threadState = PARALLEL_DECODE_WORKER_EXIT;
            break;
        }
    }

    if (decodeCxt[slot].ParallelReaderWorkerStatus.threadId == exitedTid) {
        decodeCxt[slot].ParallelReaderWorkerStatus.threadState = PARALLEL_DECODE_WORKER_EXIT;
    }

    g_Logicaldispatcher[slot].abnormal = true;
}

/*
 * Install the walsender's signal dispositions.
 *
 * SIGHUP, SIGTERM, SIGQUIT, SIGUSR1, SIGUSR2 and SIGCHLD are routed to the
 * walsender-specific handlers defined in this file; SIGALRM goes to
 * handle_sig_alarm and SIGURG to print_stack.  SIGINT and SIGPIPE are
 * ignored, and SIGTTIN/SIGTTOU/SIGCONT/SIGWINCH are put back to their
 * default dispositions.
 */
void WalSndSignals(void)
{
    /* Handlers the walsender reacts to */
    (void)gspqsignal(SIGHUP, WalSndSigHupHandler);    /* set flag to read config file */
    (void)gspqsignal(SIGINT, SIG_IGN);                /* not used */
    (void)gspqsignal(SIGTERM, WalSndShutdownHandler); /* request shutdown */
    (void)gspqsignal(SIGQUIT, WalSndQuickDieHandler); /* hard crash time */
    (void)gspqsignal(SIGALRM, handle_sig_alarm);
    (void)gspqsignal(SIGPIPE, SIG_IGN);
    (void)gspqsignal(SIGUSR1, WalSndXLogSendHandler);  /* request WAL sending */
    (void)gspqsignal(SIGUSR2, WalSndLastCycleHandler); /* request a last cycle and shutdown */
    (void)gspqsignal(SIGURG, print_stack);
    (void)gspqsignal(SIGCHLD, WalSndSigChldHandler);
    /* Reset some signals that are accepted by postmaster but not here */
    (void)gspqsignal(SIGTTIN, SIG_DFL);
    (void)gspqsignal(SIGTTOU, SIG_DFL);
    (void)gspqsignal(SIGCONT, SIG_DFL);
    (void)gspqsignal(SIGWINCH, SIG_DFL);
}

/*
 * Report how much shared memory WalSndShmemInit needs: the WalSndCtlData
 * header up to its walsnds[] array plus one WalSnd per configured walsender
 * (max_wal_senders).  Uses the overflow-checked add_size/mul_size helpers.
 */
Size WalSndShmemSize(void)
{
    const Size headerBytes = offsetof(WalSndCtlData, walsnds);
    const Size slotBytes = mul_size(g_instance.attr.attr_storage.max_wal_senders, sizeof(WalSnd));

    return add_size(headerBytes, slotBytes);
}

/* Allocate and initialize walsender-related shared memory */
void WalSndShmemInit(void)
{
    bool found = false;
    errno_t rc = 0;
    int i;

    t_thrd.walsender_cxt.WalSndCtl = (WalSndCtlData *)ShmemInitStruct("Wal Sender Ctl", WalSndShmemSize(), &found);

    if (!found) {
        /* First time through, so initialize */
        rc = memset_s(t_thrd.walsender_cxt.WalSndCtl, WalSndShmemSize(), 0, WalSndShmemSize());
        securec_check(rc, "\0", "\0");

        for (i = 0; i < NUM_SYNC_REP_WAIT_MODE; i++)
            SHMQueueInit(&(t_thrd.walsender_cxt.WalSndCtl->SyncRepQueue[i]));

        SHMQueueInit(&(t_thrd.walsender_cxt.WalSndCtl->SyncPaxosQueue));

        for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
            WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

            walsnd->sendKeepalive = false;
            SpinLockInit(&walsnd->mutex);
            InitSharedLatch(&walsnd->latch);
        }
        t_thrd.walsender_cxt.WalSndCtl->most_available_sync = false;
        t_thrd.walsender_cxt.WalSndCtl->sync_master_standalone = false;
        t_thrd.walsender_cxt.WalSndCtl->keep_sync_window_start = 0;
        t_thrd.walsender_cxt.WalSndCtl->out_keep_sync_window = false;
        t_thrd.walsender_cxt.WalSndCtl->demotion = NoDemote;
        SpinLockInit(&t_thrd.walsender_cxt.WalSndCtl->mutex);
    }
}

/*
 * Wake up all walsenders by setting the latch of every walsender slot
 * (slots are not filtered by pid).
 */
void WalSndWakeup(void)
{
    for (int slot = 0; slot < g_instance.attr.attr_storage.max_wal_senders; slot++) {
        SetLatch(&t_thrd.walsender_cxt.WalSndCtl->walsnds[slot].latch);
    }
}

/* return true if any standby(except dummy standby) caught up primary */
static bool WalSndCaughtup(void)
{
    int i;
    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        SpinLockAcquire(&walsnd->mutex);

        if (walsnd->pid != 0 && walsnd->sendRole == SNDROLE_PRIMARY_STANDBY && walsnd->state == WALSNDSTATE_STREAMING) {
            SpinLockRelease(&walsnd->mutex);

            return true;
        }

        SpinLockRelease(&walsnd->mutex);
    }

    return false;
}

/* return true if standby has flush more xlog than dummy standby */
static bool WalSndDummyLEStandby(void)
{
    XLogRecPtr flushDummy = InvalidXLogRecPtr;
    XLogRecPtr flushStandby = InvalidXLogRecPtr;
    int i;

    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        SpinLockAcquire(&walsnd->mutex);

        if (walsnd->pid != 0 && walsnd->sendRole == SNDROLE_PRIMARY_STANDBY) {
            flushStandby = walsnd->flush;
        } else if (walsnd->pid != 0 && walsnd->sendRole == SNDROLE_PRIMARY_DUMMYSTANDBY) {
            flushDummy = walsnd->flush;
        }

        SpinLockRelease(&walsnd->mutex);
    }

    if (XLByteEQ(flushDummy, InvalidXLogRecPtr) || XLByteEQ(flushStandby, InvalidXLogRecPtr))
        return true;

    return XLByteLE(flushDummy, flushStandby);
}

/* check if there is any wal sender alive. */
bool WalSndInProgress(int type)
{
    int i;

    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        SpinLockAcquire(&walsnd->mutex);

        if (walsnd->pid != 0 && walsnd->pid != t_thrd.proc_cxt.MyProcPid &&
            ((walsnd->sendRole & type) == walsnd->sendRole)) {
            SpinLockRelease(&walsnd->mutex);

            return true;
        }

        SpinLockRelease(&walsnd->mutex);
    }

    return false;
}

/*
 * Check whether every synchronous-standby group has a quorum of walsenders of
 * the given kind.
 *
 * type is a bit mask of send roles.  Walsenders other than the caller whose
 * sendRole bits are all contained in type are counted per
 * sync_standby_group; the function returns true only if, for every configured
 * group i, the count is at least SyncRepConfig[i]->num_sync.
 *
 * The group index stored in a walsender slot is validated against this
 * thread's SyncRepConfigGroups before it is used as an array index.  An
 * out-of-range index (e.g. a slot whose group was set under a different sync
 * configuration, or any slot when no group is configured -- presumably
 * possible around config reloads) would otherwise write past the counter
 * array while the spinlock is held.  Such slots cannot contribute to any
 * configured group, so skipping them does not change the result.
 */
bool WalSndQuorumInProgress(int type)
{
    const int groupCount = t_thrd.syncrep_cxt.SyncRepConfigGroups;
    int *nums = (int *)palloc0(groupCount * sizeof(int));
    bool quorumReached = true;
    int i;

    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        SpinLockAcquire(&walsnd->mutex);
        if (walsnd->pid != 0 && walsnd->pid != t_thrd.proc_cxt.MyProcPid &&
            ((walsnd->sendRole & type) == walsnd->sendRole)) {
            int group = (int)walsnd->sync_standby_group;

            /* never index outside the counters allocated above */
            if (group >= 0 && group < groupCount) {
                nums[group]++;
            }
        }
        SpinLockRelease(&walsnd->mutex);
    }

    for (i = 0; i < groupCount; i++) {
        if (t_thrd.syncrep_cxt.SyncRepConfig[i]->num_sync > nums[i]) {
            quorumReached = false;
            break;
        }
    }

    pfree(nums);
    return quorumReached;
}

bool WalSndAllInProgressForMainStandby(int type)
{
    int i;
    int num = 0;
    int allNum = 0;
    for (i = 1; i < MAX_REPLNODE_NUM; i++) {
        ReplConnInfo *replConnInfo = NULL;
        replConnInfo = t_thrd.postmaster_cxt.ReplConnArray[i];
        if (replConnInfo != NULL && replConnInfo->isCascade) {
            allNum++;
        }
    }
    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];
        SpinLockAcquire(&walsnd->mutex);
        if (walsnd->pid != 0 && walsnd->pid != t_thrd.proc_cxt.MyProcPid &&
            ((walsnd->sendRole & type) == walsnd->sendRole) &&
            walsnd->sentPtr > 0) {
            num++;
        }
        SpinLockRelease(&walsnd->mutex);
    }
    if (num >= allNum) {
        return true;
    } else {
        return false;
    }
}

/* check if there is all wal sender in type status. */
bool WalSndAllInProgress(int type)
{
    int i;
    int num = 0;
    int allNum = 0;

    for (i = 1; i < DOUBLE_MAX_REPLNODE_NUM; i++) {
        ReplConnInfo *replConnInfo = NULL;
        if (i >= MAX_REPLNODE_NUM) {
            replConnInfo = t_thrd.postmaster_cxt.CrossClusterReplConnArray[i - MAX_REPLNODE_NUM];
        } else {
            replConnInfo = t_thrd.postmaster_cxt.ReplConnArray[i];
        }
        if (t_thrd.postmaster_cxt.HaShmData->is_cross_region) {
            /* In streaming primary cluster, there is no cascade standby, the isCascade(true)
               is used when it becomes streaming disaster standby cluster */
            if (replConnInfo != NULL && !replConnInfo->isCrossRegion) {
                allNum++;
            }
        } else {
            /* not contains cascade standby in primary */
            if (replConnInfo != NULL && !replConnInfo->isCascade) {
                allNum++;
            }
        }
    }
    /* contain the only one main standby for streaming disaster cluster */
    if (t_thrd.postmaster_cxt.HaShmData->is_cross_region) {
        allNum++;
    }

    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];
        SpinLockAcquire(&walsnd->mutex);
        if (walsnd->pid != 0 && walsnd->pid != t_thrd.proc_cxt.MyProcPid &&
            ((walsnd->sendRole & type) == walsnd->sendRole) &&
            walsnd->sentPtr > 0) {
            num++;
        }
        SpinLockRelease(&walsnd->mutex);
    }

    if (num >= allNum) {
        return true;
    } else {
        ereport(WARNING,
            (errmsg("The number of walsender %d is less than the number of valid replconninfo %d.", num, allNum)));
        return false;
    }
}

/*
 * Check, via the walsender slots, whether any standby or secondary is alive.
 *
 * Background: if a standby was wrongly promoted while the old primary is
 * still alive, both primaries could write a same-named file on the dfs.  Only
 * the primary that still has a standby or secondary connected should be
 * creating such files.
 *
 * Note that this function only writes a LOG message when the node is not in
 * NORMAL_MODE and no standby/dummy-standby walsender is in progress; it does
 * not raise an error itself.
 */
void StandbyOrSecondaryIsAlive(void)
{
    if (t_thrd.postmaster_cxt.HaShmData->current_mode != NORMAL_MODE &&
        !WalSndInProgress(SNDROLE_PRIMARY_STANDBY | SNDROLE_PRIMARY_DUMMYSTANDBY)) {
        ereport(LOG, (errmsg("No standby or secondary is connected, a new dfs file "
                             "can not be created")));
    }
}

/*
 * Set the state of the current walsender (only called in a walsender).
 *
 * Nothing happens if the slot is already in the requested state (checked
 * without the lock).  Otherwise the state is stored under the slot's spinlock,
 * and entering CATCHUP or STREAMING additionally stamps catchupTime[0] or
 * catchupTime[1] respectively with the current timestamp.
 */
void WalSndSetState(WalSndState state)
{
    /* volatile pointer keeps the compiler from rearranging these accesses */
    volatile WalSnd *self = t_thrd.walsender_cxt.MyWalSnd;

    Assert(AM_WAL_SENDER);

    if (self->state != state) {
        SpinLockAcquire(&self->mutex);
        self->state = state;
        switch (state) {
            case WALSNDSTATE_CATCHUP:
                self->catchupTime[0] = GetCurrentTimestamp();
                break;
            case WALSNDSTATE_STREAMING:
                self->catchupTime[1] = GetCurrentTimestamp();
                break;
            default:
                break;
        }
        SpinLockRelease(&self->mutex);
    }
}

/*
 * Map a walsender state to its display name.  The result is a string
 * constant shown in system views and must *not* be translated.  Any value
 * outside the four known states yields "Unknown".
 */
static const char *WalSndGetStateString(WalSndState state)
{
    const char *label = "Unknown";

    switch (state) {
        case WALSNDSTATE_STARTUP:
            label = "Startup";
            break;
        case WALSNDSTATE_BACKUP:
            label = "Backup";
            break;
        case WALSNDSTATE_CATCHUP:
            label = "Catchup";
            break;
        case WALSNDSTATE_STREAMING:
            label = "Streaming";
            break;
    }

    return label;
}

/*
 * Fill in the local write/flush/replay xlog positions for the given role.
 *
 * PRIMARY_MODE: flush and write come from the local xlog flush/write
 * pointers and replay is reported as equal to flush.
 * Any other role: replay, flush and write come from the replay pointer, the
 * standby flush pointer and the walreceiver write pointer respectively.
 */
static void set_xlog_location(ServerMode local_role, XLogRecPtr* sndWrite, XLogRecPtr* sndFlush, XLogRecPtr* sndReplay)
{
    if (local_role != PRIMARY_MODE) {
        *sndReplay = GetXLogReplayRecPtr(NULL);
        *sndFlush = GetStandbyFlushRecPtr(NULL);
        *sndWrite = GetWalRcvWriteRecPtr(NULL);
        return;
    }

    *sndFlush = GetFlushRecPtr();
    *sndWrite = GetXLogWriteRecPtr();
    /* a primary has nothing to replay: report flush as the replay position */
    *sndReplay = *sndFlush;
}

/*
 * SQL-callable function returning one row of local paxos/DCF replication
 * positions.
 *
 * The row has six columns, emitted in this order: paxos write location,
 * paxos commit location, local write location, local flush location, local
 * replay location, and the DCF stream-info string.
 *
 * Callers that are neither superuser, nor operator admin with operation_mode
 * enabled, nor members of DEFAULT_ROLE_REPLICATION receive a row in which
 * every column is NULL.
 *
 * The result is delivered through the tuplestore built by BuildTupleResult;
 * the Datum return value itself is always 0.
 */
Datum get_paxos_replication_info(PG_FUNCTION_ARGS)
{
    /* number of output columns */
    unsigned int paxosReplicaInfoTotal = 6;

    TupleDesc tupdesc = NULL;
    Tuplestorestate *tupstore = NULL;

    XLogRecPtr paxosWrite = InvalidXLogRecPtr;
    XLogRecPtr paxosCommit = InvalidXLogRecPtr;
    XLogRecPtr localWrite = InvalidXLogRecPtr;
    XLogRecPtr localFlush = InvalidXLogRecPtr;
    XLogRecPtr localReplay = InvalidXLogRecPtr;

    Datum values[paxosReplicaInfoTotal];
    bool nulls[paxosReplicaInfoTotal];

    /* scratch buffer reused for every "%X/%X" formatted location */
    char location[MAXFNAMELEN] = {0};
    char *replicInfo = nullptr;

    int ret = 0;
    int j = 0;
    errno_t rc = EOK;

    /* start with every column marked non-NULL */
    rc = memset_s(nulls, sizeof(nulls), 0, sizeof(nulls));
    securec_check(rc, "\0", "\0");

    ServerMode local_role = UNKNOWN_MODE;
    volatile HaShmemData* hashmdata = t_thrd.postmaster_cxt.HaShmData;

    /* read the current server mode under the HA shared-memory spinlock */
    SpinLockAcquire(&hashmdata->mutex);
    local_role = hashmdata->current_mode;
    SpinLockRelease(&hashmdata->mutex);

    set_xlog_location(local_role, &localWrite, &localFlush, &localReplay);

    tupstore = BuildTupleResult(fcinfo, &tupdesc);

    if (!superuser() && !(isOperatoradmin(GetUserId()) && u_sess->attr.attr_security.operation_mode) &&
        !is_member_of_role(GetUserId(), DEFAULT_ROLE_REPLICATION)) {
        /*
         * Only privileged users can see details. Everyone else gets a row
         * whose columns are all NULL (values[] is left unset in that case).
         */
        rc = memset_s(nulls, sizeof(nulls), 1, sizeof(nulls));
        securec_check(rc, "\0", "\0");
    } else {

#ifndef ENABLE_MULTIPLE_NODES
        /* paxos_commit_location: on a primary, taken from the paxos consensus pointer */
        if (local_role == PRIMARY_MODE)
            paxosCommit = GetPaxosConsensusRecPtr();
#endif
        /* on a standby the paxos commit location is reported as the local write location */
        if (local_role == STANDBY_MODE)
            paxosCommit = localWrite;

#ifndef ENABLE_MULTIPLE_NODES
        /* paxos_write_location: on a primary, taken from the paxos write pointer */
        if (local_role == PRIMARY_MODE)
            paxosWrite = GetPaxosWriteRecPtr();
#endif
        /* on a standby the paxos write location is reported as the local write location */
        if (local_role == STANDBY_MODE)
            paxosWrite = localWrite;

        /* column 1: paxos write location (stays invalid, i.e. 0/0, if not set above) */
        ret = snprintf_s(location, sizeof(location), sizeof(location) - 1,
                         "%X/%X", static_cast<uint32>(paxosWrite >> 32), static_cast<uint32>(paxosWrite));
        securec_check_ss(ret, "\0", "\0");
        values[j++] = CStringGetTextDatum(location);

        /* column 2: paxos commit location */
        ret = snprintf_s(location, sizeof(location), sizeof(location) - 1,
                         "%X/%X", static_cast<uint32>(paxosCommit >> 32), static_cast<uint32>(paxosCommit));
        securec_check_ss(ret, "\0", "\0");
        values[j++] = CStringGetTextDatum(location);

        /* local_write_location */
        ret = snprintf_s(location, sizeof(location), sizeof(location) - 1,
                         "%X/%X", static_cast<uint32>(localWrite >> 32), static_cast<uint32>(localWrite));
        securec_check_ss(ret, "\0", "\0");
        values[j++] = CStringGetTextDatum(location);

        /* local_flush_location */
        ret = snprintf_s(location, sizeof(location), sizeof(location) - 1,
                         "%X/%X", static_cast<uint32>(localFlush >> 32), static_cast<uint32>(localFlush));
        securec_check_ss(ret, "\0", "\0");
        values[j++] = CStringGetTextDatum(location);

        /* local_replay_location */
        ret = snprintf_s(location, sizeof(location), sizeof(location) - 1,
                         "%X/%X", static_cast<uint32>(localReplay >> 32), static_cast<uint32>(localReplay));
        securec_check_ss(ret, "\0", "\0");
        values[j++] = CStringGetTextDatum(location);


        /* zero-filled buffer: stays an empty string unless DCF fills it in below */
        replicInfo = static_cast<char*>(palloc0(DCF_MAX_STREAM_INFO_LEN * sizeof(char)));
#ifndef ENABLE_MULTIPLE_NODES
        if (g_instance.attr.attr_storage.dcf_attr.enable_dcf && t_thrd.dcf_cxt.dcfCtxInfo->isDcfStarted)
            dcf_query_stream_info(1, replicInfo, DCF_MAX_STREAM_INFO_LEN * sizeof(char));
#endif

        /* DCF replication information */
        values[j] = CStringGetTextDatum(replicInfo);
    }

    tuplestore_putvalues(tupstore, tupdesc, values, nulls);

    /* clean up and return the tuplestore */
    tuplestore_donestoring(tupstore);

    /* free the DCF stream-info buffer (only allocated on the privileged path) */
    if (replicInfo != nullptr)
        pfree(replicInfo);

    return (Datum) 0;
}

/*
 * Returns activity of DCF replication.
 * Mainly shows xlog location which a standby has written, flushed, committed and replayed.
 *
 * Raises ERROR (feature not supported) unless DCF is enabled.  Otherwise one
 * row with NODE_INFO_COLS (16) columns is produced for every DCF node marked
 * as a member in dcfCtxInfo->nodes_info; the columns are, in order:
 * local role, peer role, local dcf role, peer dcf role, peer state,
 * sender write/commit/flush/replay location, peer write/commit/flush/replay
 * location, sync percent, dcf run mode and channel ("ip:port-->ip:port").
 *
 * Callers that are neither superuser, nor operator admin with operation_mode
 * enabled, nor monitor admin get rows in which every column is NULL.
 *
 * Rows are delivered through the tuplestore built by BuildTupleResult; the
 * Datum return value itself is always 0.  When ENABLE_MULTIPLE_NODES is
 * defined the body is compiled out and no rows are produced.
 */
Datum gs_paxos_stat_replication(PG_FUNCTION_ARGS)
{
    if (!g_instance.attr.attr_storage.dcf_attr.enable_dcf) {
        ereport(ERROR,
                (errmodule(MOD_DCF),
                errcode(ERRCODE_FEATURE_NOT_SUPPORTED),
                errmsg("Un-support feature"),
                errdetail("DCF mode support only")));
        PG_RETURN_NULL();
    }
#ifndef ENABLE_MULTIPLE_NODES
    const int NODE_INFO_COLS = 16;
    const int DCF_ROLE_LEN = 64;
    TupleDesc tupdesc;
    Tuplestorestate *tupstore = nullptr;
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    tupstore = BuildTupleResult(fcinfo, &tupdesc);
    char localDCFRole[DCF_ROLE_LEN] = {0};
    char localDCFIP[IP_LEN] = {0};
    int localDCFPort = 0;
    int localNodeID = g_instance.attr.attr_storage.dcf_attr.dcf_node_id;
    /* Parse dcf_config to a json format to get dcf role, ip and port of every nodes */
    cJSON *nodeInfos = nullptr;
    const cJSON *nodeJsons = nullptr;
    /* The JSON tree is released before every ERROR exit as well as at the end. */
    if (!GetNodeInfos(&nodeInfos)) {
        cJSON_Delete(nodeInfos);
        ereport(ERROR, (errmodule(MOD_DCF), errmsg("Parse dcf info failed!")));
    } else {
        nodeJsons = cJSON_GetObjectItem(nodeInfos, "nodes");
        if (nodeJsons == nullptr) {
            cJSON_Delete(nodeInfos);
            ereport(ERROR, (errmodule(MOD_DCF), errmsg("Get nodes info failed!")));
        }
        if (!GetDCFNodeInfo(nodeJsons, localNodeID, localDCFRole, DCF_ROLE_LEN, localDCFIP, IP_LEN, &localDCFPort)) {
            cJSON_Delete(nodeInfos);
            ereport(ERROR, (errmodule(MOD_DCF), errmsg("Get dcf role, ip and port of local node failed!")));
        }
    }
    for (int i = 0; i < DCF_MAX_NODES; i++) {
        /* only DCF members produce a row */
        bool isMember = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].isMember;
        if (!isMember) {
            continue;
        }
        Datum values[NODE_INFO_COLS];
        bool nulls[NODE_INFO_COLS];
        int j = 0;
        errno_t rc = 0;
        int ret = 0;
        rc = memset_s(nulls, sizeof(nulls), 0, sizeof(nulls));
        securec_check(rc, "\0", "\0");

        if (!superuser() && !(isOperatoradmin(GetUserId()) && u_sess->attr.attr_security.operation_mode) &&
            !isMonitoradmin(GetUserId())) {
            /*
             * Only privileged users can see details. Everyone else gets a
             * row whose columns are all NULL (j is still 0 here, so the
             * whole nulls[] array is set).
             */
            rc = memset_s(&nulls[j], NODE_INFO_COLS - j, true, NODE_INFO_COLS - j);
            securec_check(rc, "", "");
        } else {
            /* scratch buffer reused for every formatted text column */
            char location[MAXFNAMELEN] = {0};
            uint32 nodeID = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].nodeID;
            XLogRecPtr write = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].write;
            /* the peer commit location is reported as equal to its write location */
            XLogRecPtr commit = write;
            XLogRecPtr flush = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].flush;
            XLogRecPtr apply = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].apply;
            ServerMode peerRole = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].peer_role;
            DbState peerState = t_thrd.dcf_cxt.dcfCtxInfo->nodes_info[i].peer_state;
            XLogRecPtr syncStart;
            XLogRecPtr sndWrite, sndFlush;
            XLogRecPtr sndCommit;
            XLogRecPtr sndReplay;
            ServerMode localRole;
            int dcfRunMode = u_sess->attr.attr_storage.dcf_attr.dcf_run_mode;
            char peerDCFRole[DCF_ROLE_LEN] = {0};
            char peerDCFIP[IP_LEN] = {0};
            int peerDCFPort = 0;
            if (!GetDCFNodeInfo(nodeJsons, nodeID, peerDCFRole, DCF_ROLE_LEN, peerDCFIP, IP_LEN, &peerDCFPort)) {
                cJSON_Delete(nodeInfos);
                /* this lookup is for the peer, so name the peer (not the local node) in the error */
                ereport(ERROR, (errmodule(MOD_DCF),
                                errmsg("Get dcf role, ip and port of peer node %u failed!", nodeID)));
            }
            int syncPercent = 0;
            /* read the local role under the HA shared-memory spinlock */
            SpinLockAcquire(&hashmdata->mutex);
            localRole = hashmdata->current_mode;
            SpinLockRelease(&hashmdata->mutex);
            /* sender-side positions; replay is reported as equal to flush */
            sndFlush = GetFlushRecPtr();
            sndReplay = sndFlush;
            sndCommit = GetPaxosConsensusRecPtr();
            sndWrite = GetPaxosWriteRecPtr();

            /* local role */
            values[j++] = CStringGetTextDatum(wal_get_role_string(localRole));

            /* peer role */
            values[j++] = CStringGetTextDatum(wal_get_role_string(peerRole));

            /* local dcf role */
            values[j++] = CStringGetTextDatum(localDCFRole);
            /* peer dcf role */
            values[j++] = CStringGetTextDatum(peerDCFRole);
            /* peer_state */
            values[j++] = CStringGetTextDatum(wal_get_db_state_string(peerState));
            /* sender write location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(sndWrite >> 32), (uint32)sndWrite);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);
            /* sender commit location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(sndCommit >> 32), (uint32)sndCommit);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* sender flush location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(sndFlush >> 32), (uint32)sndFlush);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* sender replay location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(sndReplay >> 32), (uint32)sndReplay);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* peer write location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(write >> 32), (uint32)write);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);
            /* peer commit location (equals the peer write location) */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(commit >> 32), (uint32)commit);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* peer flush location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(flush >> 32), (uint32)flush);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* peer replay location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X",
                             (uint32)(apply >> 32), (uint32)apply);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);
            /*
             * sync_percent: when the peer's flush position is within the sync
             * count window of the sender's flush position, an invalid start
             * pointer is passed to GetSyncPercent; otherwise the peer's flush
             * position is used as the start.
             */
            uint64 countWindow = ((uint64)WalGetSyncCountWindow() * XLogSegSize);
            if (XLogDiff(sndFlush, flush) < countWindow) {
                syncStart = InvalidXLogRecPtr;
            } else {
                syncStart = flush;
            }
            syncPercent = GetSyncPercent(syncStart, sndFlush, flush);
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%d%%", syncPercent);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* dcf run mode */
            values[j++] = Int32GetDatum(dcfRunMode);
            /* channel */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%s:%d-->%s:%d",
                             localDCFIP, localDCFPort, peerDCFIP, peerDCFPort);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);
        }
        tuplestore_putvalues(tupstore, tupdesc, values, nulls);
    }
    /* clean up and return the tuplestore */
    cJSON_Delete(nodeInfos);
    tuplestore_donestoring(tupstore);
#endif
    return (Datum)0;
}

/*
 * Returns activity of walsenders, including pids and xlog locations sent to
 * standby servers.
 *
 * One row is appended to the result tuplestore for every WalSnd slot whose
 * pid and lwpId are both non-zero. Each row has
 * PG_STAT_GET_WAL_SENDERS_COLS (21) columns, filled in this order:
 *   pid, lwpId, local role, peer role, peer state, sender state,
 *   catchup start, catchup end, sender sent/write/flush/replay locations,
 *   receiver received/write/flush/replay locations, sync percent,
 *   sync state, sync priority, most-available-sync flag, channel.
 * Callers that are not superuser, not an operator admin in operation mode and
 * not a monitor admin only get pid and lwpId; every other column is NULL.
 *
 * The function always returns (Datum)0; the rows are delivered through the
 * tuplestore obtained from BuildTupleResult().
 */
Datum pg_stat_get_wal_senders(PG_FUNCTION_ARGS)
{
#define PG_STAT_GET_WAL_SENDERS_COLS 21

    TupleDesc tupdesc;
    int *sync_priority = NULL;
    int i = 0;
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    SyncRepStandbyData *sync_standbys;
    int num_standbys;

    Tuplestorestate *tupstore = BuildTupleResult(fcinfo, &tupdesc);

    if (IS_DN_DUMMY_STANDYS_MODE()) {
        /*
         * Get the priorities of sync standbys all in one go, to minimise lock
         * acquisitions and to allow us to evaluate who is the current sync
         * standby. This code must match the code in SyncRepReleaseWaiters().
         *
         * NOTE(review): only entries whose slot has pid != 0 are assigned
         * below; the other entries of the palloc'd array are never written
         * in this function.
         */
        sync_priority = (int *)palloc(sizeof(int) * g_instance.attr.attr_storage.max_wal_senders);
        for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
            /* use volatile pointer to prevent code rearrangement */
            volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

            if (walsnd->pid != 0) {
                /*
                 * Treat a standby such as a pg_basebackup background process
                 * which always returns an invalid flush location, as an
                 * asynchronous standby.
                 */
                sync_priority[i] = XLogRecPtrIsInvalid(walsnd->flush) ? 0 : walsnd->sync_standby_priority;
            }
        }
    }

    /*
     * Get the currently active synchronous standbys. This could be out of
     * date before we're done, but we'll use the data anyway.
     */
    num_standbys = SyncRepGetSyncStandbys(&sync_standbys);

    for (i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];
        /* scratch buffer reused for every text column formatted below */
        char location[MAXFNAMELEN * 3] = {0};
        XLogRecPtr sentRecPtr, local_write;
        XLogRecPtr flush, apply;
        WalSndState state;
        XLogRecPtr sndWrite, sndFlush;
        XLogRecPtr sndReplay, RcvReceived;
        XLogRecPtr syncStart;

        int sync_percent = 0;
        ServerMode peer_role;
        SndRole snd_role;
        DbState peer_state;
        ServerMode local_role;
        char localip[IP_LEN] = {0};
        char remoteip[IP_LEN] = {0};
        TimestampTz catchup_time[2];
        int localport = 0;
        int remoteport = 0;
        Datum values[PG_STAT_GET_WAL_SENDERS_COLS];
        bool nulls[PG_STAT_GET_WAL_SENDERS_COLS];
        /* j is the index of the next output column to fill */
        int j = 0;
        int k = 0;
        errno_t rc = 0;
        int ret = 0;
        int group = 0;
        int priority = 0;

        bool is_sync_standby = false;

        /*
         * Read the local server mode under the HA spinlock and skip slots
         * that are not in use. Note that walsnd->pid / walsnd->lwpId are
         * checked here without holding walsnd->mutex.
         */
        SpinLockAcquire(&hashmdata->mutex);
        local_role = hashmdata->current_mode;
        if (walsnd->pid == 0 || walsnd->lwpId == 0) {
            SpinLockRelease(&hashmdata->mutex);
            continue;
        }
        SpinLockRelease(&hashmdata->mutex);

        /* Take a snapshot of the slot's fields under its own spinlock. */
        SpinLockAcquire(&walsnd->mutex);

        localport = walsnd->wal_sender_channel.localport;
        remoteport = walsnd->wal_sender_channel.remoteport;
        rc = strncpy_s(localip, IP_LEN, (char *)walsnd->wal_sender_channel.localhost, IP_LEN - 1);
        securec_check(rc, "\0", "\0");
        rc = strncpy_s(remoteip, IP_LEN, (char *)walsnd->wal_sender_channel.remotehost, IP_LEN - 1);
        securec_check(rc, "\0", "\0");
        localip[IP_LEN - 1] = '\0';
        remoteip[IP_LEN - 1] = '\0';
        peer_role = walsnd->peer_role;
        snd_role = walsnd->sendRole;
        peer_state = walsnd->peer_state;
        state = walsnd->state;
        sentRecPtr = walsnd->sentPtr;
        local_write = walsnd->write;
        flush = walsnd->flush;
        apply = walsnd->apply;
        RcvReceived = walsnd->receive;
        syncStart = walsnd->syncPercentCountStart;
        catchup_time[0] = walsnd->catchupTime[0];
        catchup_time[1] = walsnd->catchupTime[1];
        if (IS_DN_MULTI_STANDYS_MODE()) {
            group = walsnd->sync_standby_group;
            priority = walsnd->sync_standby_priority;
        }
        SpinLockRelease(&walsnd->mutex);

        /* Fills the local write/flush/replay positions based on local_role. */
        set_xlog_location(local_role, &sndWrite, &sndFlush, &sndReplay);

        /*
         * With shared storage (and when this thread is not a HADR sender),
         * all sender-side positions are replaced by the insertHead read from
         * the shared-storage control info.
         */
        if (IS_SHARED_STORAGE_MODE && !AM_WAL_HADR_SENDER) {
            ShareStorageXLogCtl *ctlInfo = AlignAllocShareStorageCtl();
            ReadShareStorageCtlInfo(ctlInfo);
            sentRecPtr = ctlInfo->insertHead;
            sndWrite = ctlInfo->insertHead;
            sndFlush = ctlInfo->insertHead;
            sndReplay = ctlInfo->insertHead;
            AlignFreeShareStorageCtl(ctlInfo);
        }

        /* Same override for a Dorado replication cluster, using the instance-level control block. */
        if (SS_REPLICATION_DORADO_CLUSTER && !AM_WAL_HADR_SENDER) {
            ReadSSDoradoCtlInfoFile();
            ShareStorageXLogCtl *ctlInfo = g_instance.xlog_cxt.ssReplicationXLogCtl;
            sentRecPtr = ctlInfo->insertHead;
            sndWrite = ctlInfo->insertHead;
            sndFlush = ctlInfo->insertHead;
            sndReplay = ctlInfo->insertHead;
        }

        /*
         * If the walsender's pid has changed, we consider it is not a sync
         * standby: the slot only counts as sync when its index, pid and lwpId
         * all match an entry returned by SyncRepGetSyncStandbys().
         */
        for(k = 0; k < num_standbys; k++) {
            if(sync_standbys[k].walsnd_index == i
                && sync_standbys[k].pid == walsnd->pid
                && sync_standbys[k].lwpId == walsnd->lwpId) {
                is_sync_standby = true;
                break;
            }
        }

        rc = memset_s(nulls, sizeof(nulls), 0, sizeof(nulls));
        securec_check(rc, "\0", "\0");

        /* pid and lwpId are re-read from shared memory here, outside the spinlock */
        values[j++] = Int64GetDatum(walsnd->pid);
        values[j++] = Int32GetDatum(walsnd->lwpId);

        if (!superuser() && !(isOperatoradmin(GetUserId()) && u_sess->attr.attr_security.operation_mode) &&
            !isMonitoradmin(GetUserId())) {
            /*
             * Only superusers can see details. Other users only get the pid
             * value to know it's a walsender, but no details.
             *
             * NOTE(review): the memset_s length is an element count used as a
             * byte count, which assumes sizeof(bool) == 1.
             */
            rc = memset_s(&nulls[j], PG_STAT_GET_WAL_SENDERS_COLS - j, true, PG_STAT_GET_WAL_SENDERS_COLS - j);
            securec_check(rc, "", "");
        } else {
            /* local_role */
            values[j++] = CStringGetTextDatum(wal_get_role_string(local_role));

            /* peer_role */
            if (snd_role == SNDROLE_PRIMARY_DUMMYSTANDBY)
                values[j++] = CStringGetTextDatum("Secondary");
            else {
                if (peer_role != STANDBY_CLUSTER_MODE) {
                    /* current_mode is read here without taking hashmdata->mutex */
                    if (t_thrd.postmaster_cxt.HaShmData->current_mode == STANDBY_MODE) {
                        values[j++] = CStringGetTextDatum("Cascade Standby");
                    } else {
                        values[j++] = CStringGetTextDatum("Standby");
                    }
                } else {
                    values[j++] = CStringGetTextDatum("StandbyCluster_Standby");
                }
            }

            /* peer_state */
            values[j++] = CStringGetTextDatum(wal_get_db_state_string(peer_state));

            /* state */
            values[j++] = CStringGetTextDatum(WalSndGetStateString(state));

            /* catchup time: start is NULL when zero; end is NULL when zero or while still catching up */
            if (catchup_time[0] != 0)
                values[j++] = TimestampTzGetDatum(catchup_time[0]);
            else
                nulls[j++] = true;
            if (catchup_time[1] != 0 && (state != WALSNDSTATE_CATCHUP))
                values[j++] = TimestampTzGetDatum(catchup_time[1]);
            else
                nulls[j++] = true;

            /* sender_sent_location */
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(sentRecPtr >> 32),
                             (uint32)sentRecPtr);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /*
             * For each of the following locations a zero value is replaced
             * through SETXLOGLOCATION(target, sentRecPtr) before formatting.
             * NOTE(review): SETXLOGLOCATION is a macro defined elsewhere and
             * is invoked without a trailing semicolon; presumably it assigns
             * sentRecPtr to the target -- confirm against its definition.
             */

            /* sender_write_location */
            if (sndWrite == 0)
                SETXLOGLOCATION(sndWrite, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(sndWrite >> 32),
                             (uint32)sndWrite);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* sender_flush_location */
            if (sndFlush == 0)
                SETXLOGLOCATION(sndFlush, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(sndFlush >> 32),
                             (uint32)sndFlush);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* sender_replay_location */
            if (sndReplay == 0)
                SETXLOGLOCATION(sndReplay, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(sndReplay >> 32),
                             (uint32)sndReplay);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* receiver_received_location */
            if (RcvReceived == 0)
                SETXLOGLOCATION(RcvReceived, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(RcvReceived >> 32),
                             (uint32)RcvReceived);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* receiver_write_location */
            if (local_write == 0)
                SETXLOGLOCATION(local_write, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(local_write >> 32),
                             (uint32)local_write);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* receiver_flush_location */
            if (flush == 0)
                SETXLOGLOCATION(flush, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(flush >> 32),
                             (uint32)flush);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* receiver_replay_location */
            if (apply == 0)
                SETXLOGLOCATION(apply, sentRecPtr)
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%X/%X", (uint32)(apply >> 32),
                             (uint32)apply);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            /* sync_percent, rendered as "<n>%" */
            sync_percent = GetSyncPercent(syncStart, sndFlush, flush);
            ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%d%%", sync_percent);
            securec_check_ss(ret, "\0", "\0");
            values[j++] = CStringGetTextDatum(location);

            if (IS_DN_DUMMY_STANDYS_MODE()) {
                /* sync_state and sync_priority */
                if (!SyncRepRequested()) {
                    values[j++] = CStringGetTextDatum("Async");
                    values[j++] = Int32GetDatum(0);
                } else {
                    values[j++] = CStringGetTextDatum("Sync");
                    values[j++] = Int32GetDatum(sync_priority[i]);
                }
            } else {
                /*
                 * Treat a standby such as a pg_basebackup background process
                 * which always returns an invalid flush location, as an
                 * asynchronous standby.
                 *
                 * This re-reads walsnd->flush from shared memory (without the
                 * spinlock) instead of using the local "flush", which may
                 * already have been replaced by SETXLOGLOCATION above.
                 */
                priority = XLogRecPtrIsInvalid(walsnd->flush) ? 0 : priority;
                /*
                 * More easily understood version of standby state. This is purely
                 * informational.
                 * In quorum-based sync replication, the role of each standby
                 * listed in synchronous_standby_names can be changing very
                 * frequently. Any standbys considered as "sync" at one moment can
                 * be switched to "potential" ones at the next moment. So, it's
                 * basically useless to report "sync" or "potential" as their sync
                 * states. We report just "quorum" for them.
                 */
                if (priority == 0) {
                    values[j++] = CStringGetTextDatum("Async");
                } else if (is_sync_standby) {
                    values[j++] = GetWalsndSyncRepConfig(walsnd)->syncrep_method == SYNC_REP_PRIORITY
                                        ? CStringGetTextDatum("Sync")
                                        : CStringGetTextDatum("Quorum");
                } else {
                    values[j++] = CStringGetTextDatum("Potential");
                }
                values[j++] = Int32GetDatum(priority);
            }

            /* most-available-sync flag, reported as "On" / "Off" */
            if (most_available_sync)
                values[j++] = CStringGetTextDatum("On");
            else
                values[j++] = CStringGetTextDatum("Off");

            /* channel: "local:port-->remote:port", or an empty string if any part is missing */
            if (strlen(localip) == 0 || strlen(remoteip) == 0 || localport == 0 || remoteport == 0) {
                location[0] = '\0';
            } else {
                ret = snprintf_s(location, sizeof(location), sizeof(location) - 1, "%s:%d-->%s:%d",
                                 localip, localport, remoteip, remoteport);
                securec_check_ss(ret, "\0", "\0");
            }
            values[j++] = CStringGetTextDatum(location);
        }

        tuplestore_putvalues(tupstore, tupdesc, values, nulls);
    }

    /* Release the helper arrays allocated above. */
    if (sync_standbys != NULL) {
        pfree(sync_standbys);
        sync_standbys = NULL;
    }

    if (sync_priority != NULL) {
        pfree(sync_priority);
        sync_priority = NULL;
    }

    /* clean up and return the tuplestore */
    tuplestore_donestoring(tupstore);

    return (Datum)0;
}

/*
 * Send a keepalive message to standby.
 *
 * If requestReply is set, the message requests the other party to send
 * a message back to us, for heartbeat purposes.  We also set a flag to
 * let nearby code know that we're waiting for that response, to avoid
 * repeated requests.
 */
static void WalSndKeepalive(bool requestReply)
{
    PrimaryKeepaliveMessage keepalive_message;
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    errno_t errorno = EOK;
    /* Construct a new message */
    SpinLockAcquire(&hashmdata->mutex);
    keepalive_message.peer_role = hashmdata->current_mode;
    SpinLockRelease(&hashmdata->mutex);
    keepalive_message.peer_state = get_local_dbstate();
    keepalive_message.walEnd = t_thrd.walsender_cxt.sentPtr;
    keepalive_message.sendTime = GetCurrentTimestamp();
    keepalive_message.replyRequested = requestReply;
    keepalive_message.catchup = (t_thrd.walsender_cxt.MyWalSnd->state == WALSNDSTATE_CATCHUP);

    ereport(((requestReply && AM_WAL_DB_SENDER) ? LOG : DEBUG2), (errmsg("sending wal replication keepalive")));

    /* Prepend with the message type and send it. */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'k';
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1,
                       sizeof(WalDataMessageHeader) + g_instance.attr.attr_storage.MaxSendSize * 1024,
                       &keepalive_message, sizeof(PrimaryKeepaliveMessage));
    securec_check(errorno, "\0", "\0");
    (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message, sizeof(PrimaryKeepaliveMessage) + 1);

    /* Flush the keepalive message to standby immediately. */
    if (pq_flush_if_writable() != 0)
        WalSndShutdown();

    /* Set local flag */
    if (requestReply) {
        t_thrd.walsender_cxt.waiting_for_ping_response = true;
    }
}

/*
 * This function is used to send rm_xlog message to  xlogreceiver.
 * If requestReply is set, sets a flag in the message requesting the standby
 * to send a message back to us, for heartbeat purposes.
 */
static void WalSndRmXLog(bool requestReply)
{
    RmXLogMessage rmXLogMessage;
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    errno_t errorno = EOK;

    /* Construct a new message */
    SpinLockAcquire(&hashmdata->mutex);
    rmXLogMessage.peer_role = hashmdata->current_mode;
    SpinLockRelease(&hashmdata->mutex);
    rmXLogMessage.peer_state = get_local_dbstate();
    rmXLogMessage.sendTime = GetCurrentTimestamp();
    rmXLogMessage.replyRequested = requestReply;

    ereport(DEBUG2, (errmsg("sending dummystandby rm xlog message")));

    /* Prepend with the message type and send it. */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'x';
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1, sizeof(WalDataMessageHeader) + WS_MAX_SEND_SIZE,
                       &rmXLogMessage, sizeof(RmXLogMessage));
    securec_check(errorno, "\0", "\0");
    (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message, sizeof(RmXLogMessage) + 1);
}

/*
 * This function is used to send rm_xlog message to  xlogreceiver.
 * If requestReply is set, sets a flag in the message requesting the standby
 * to send a message back to us, for heartbeat purposes.
 */
static void WalSndSyncDummyStandbyDone(bool requestReply)
{
    EndXLogMessage endXLogMessage;
    volatile HaShmemData *hashmdata = t_thrd.postmaster_cxt.HaShmData;
    errno_t errorno = EOK;

    /* Construct a new message */
    SpinLockAcquire(&hashmdata->mutex);
    endXLogMessage.peer_role = hashmdata->current_mode;
    SpinLockRelease(&hashmdata->mutex);
    endXLogMessage.peer_state = get_local_dbstate();
    endXLogMessage.sendTime = GetCurrentTimestamp();
    endXLogMessage.percent = SYNC_DUMMY_STANDBY_END;

    ereport(dummyStandbyMode ? LOG : DEBUG2, (errmsg("send Secondary Standby xlog done")));

    /* Prepend with the message type and send it. */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'e';
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1,
                       sizeof(WalDataMessageHeader) + g_instance.attr.attr_storage.MaxSendSize * 1024, &endXLogMessage,
                       sizeof(EndXLogMessage));
    securec_check(errorno, "\0", "\0");
    (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message, sizeof(EndXLogMessage) + 1);
}

/*
 * Send a reply-requesting keepalive once half of the walsender timeout has
 * passed since the last reply from the standby.
 *
 * now: the timestamp to compare against the computed ping deadline.
 *
 * Nothing is sent when the timeout is disabled (<= 0), when no reply
 * timestamp has been recorded (<= 0), or when a ping response is already
 * being waited for.
 */
static void WalSndKeepaliveIfNecessary(TimestampTz now)
{
    int senderTimeout = WalSndTimeout();

    /* Timeouts are off, we are not taking part in them, or a ping is already outstanding. */
    if (senderTimeout <= 0 || t_thrd.walsender_cxt.last_reply_timestamp <= 0 ||
        t_thrd.walsender_cxt.waiting_for_ping_response) {
        return;
    }

    /* Deadline is the last reply time plus half of the timeout. */
    TimestampTz pingDeadline =
        TimestampTzPlusMilliseconds(t_thrd.walsender_cxt.last_reply_timestamp, senderTimeout / 2);
    if (now < pingDeadline) {
        return;
    }

    WalSndKeepalive(true);
}

/*
 * send switchover response message
 */
static void WalSndResponseSwitchover(char *msgbuf)
{
    PrimarySwitchResponseMessage response_message;
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    int maxWalSenders = g_instance.attr.attr_storage.max_wal_senders;
    errno_t errorno = EOK;

    if (walsnd == NULL)
        return;

    switch (walsnd->node_state) {
        case NODESTATE_PROMOTE_APPROVE:
            response_message.switchResponse = SWITCHOVER_PROMOTE_REQUEST;
            /* clean view data. */
            int rc;
            rc = memset_s(g_instance.rto_cxt.rto_standby_data, sizeof(RTOStandbyData) * maxWalSenders,
                0, sizeof(RTOStandbyData) * maxWalSenders);
            securec_check(rc, "", "");
#ifndef ENABLE_MULTIPLE_NODES
            rc = memset_s(&(g_instance.rto_cxt.dcf_rto_standby_data), sizeof(RTOStandbyData) * DCF_MAX_NODE_NUM,
                0, sizeof(RTOStandbyData) * DCF_MAX_NODE_NUM);
            securec_check(rc, "", "");
#endif
            break;
        case NODESTATE_PRIMARY_DEMOTING_WAIT_CATCHUP:
            response_message.switchResponse = SWITCHOVER_DEMOTE_CATCHUP_EXIST;
            break;
        case NODESTATE_STANDBY_REDIRECT:
        case NODESTATE_DEMOTE_FAILED:
        default:
            return;
    }

    response_message.walEnd = t_thrd.walsender_cxt.sentPtr;
    response_message.sendTime = GetCurrentTimestamp();

    ereport(LOG,
            (errmsg("sending switchover response message%s",
                    walsnd->node_state == NODESTATE_PRIMARY_DEMOTING_WAIT_CATCHUP ? ", meeting alive catchup" : ".")));

    /* Prepend with the message type and send it. */
    msgbuf[0] = 'p';
    errorno = memcpy_s(msgbuf + 1, sizeof(WalDataMessageHeader) + g_instance.attr.attr_storage.MaxSendSize * 1024,
                       &response_message, sizeof(PrimarySwitchResponseMessage));
    securec_check(errorno, "\0", "\0");
    (void)pq_putmessage_noblock('d', msgbuf, sizeof(PrimarySwitchResponseMessage) + 1);
}

/*
 * Queue an archive-xlog ('a') command built from *archive_message.
 *
 * archive_message: the message to transmit; its slot_name and targetLsn are
 * also written to the server log. The struct is copied verbatim behind the
 * type byte, and the frame is only queued, not flushed.
 */
static void WalSndArchiveXlog(ArchiveXlogMessage *archive_message)
{
    errno_t rc = EOK;
    uint32 lsnHigh = (uint32)(archive_message->targetLsn >> 32);
    uint32 lsnLow = (uint32)(archive_message->targetLsn);

    ereport(LOG, (errmsg("%s : WalSndArchiveXlog %X/%X", archive_message->slot_name, lsnHigh, lsnLow)));

    /* Frame layout: one type byte followed by the raw message struct. */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'a';
    rc = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1, sizeof(ArchiveXlogMessage) + WS_MAX_SEND_SIZE,
                  archive_message, sizeof(ArchiveXlogMessage));
    securec_check(rc, "\0", "\0");
    (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message, sizeof(ArchiveXlogMessage) + 1);
}

/*
 * This isn't currently used for anything. Monitoring tools might be
 * interested in the future, and we'll need something like this in the
 * future for synchronous replication.
 */
#ifdef NOT_USED
/*
 * Scan all walsender slots and return the smallest non-zero sentPtr among
 * the slots that are in use (pid != 0). Returns 0 when no such slot exists.
 */
XLogRecPtr GetOldestWALSendPointer(void)
{
    XLogRecPtr minSent = 0;
    bool haveCandidate = false;

    for (int slot = 0; slot < g_instance.attr.attr_storage.max_wal_senders; slot++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *sender = &t_thrd.walsender_cxt.WalSndCtl->walsnds[slot];
        XLogRecPtr sent;

        if (sender->pid != 0) {
            SpinLockAcquire(&sender->mutex);
            sent = sender->sentPtr;
            SpinLockRelease(&sender->mutex);

            /* A zero position carries no information; ignore it. */
            if (sent != 0) {
                if (!haveCandidate || XLByteLT(sent, minSent)) {
                    minSent = sent;
                }
                haveCandidate = true;
            }
        }
    }
    return minSent;
}

#endif

/*
 * Save the current connect channel of the walsender in walsnd.
 */
static void SetHaWalSenderChannel()
{
    struct sockaddr *laddr = (struct sockaddr *)&(u_sess->proc_cxt.MyProcPort->laddr.addr);
    struct sockaddr *raddr = (struct sockaddr *)&(u_sess->proc_cxt.MyProcPort->raddr.addr);
    char local_ip[IP_LEN] = {0};
    char remote_ip[IP_LEN] = {0};
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    char *result = NULL;
    errno_t rc = 0;

    if (laddr->sa_family == AF_INET6) {
        result = inet_net_ntop(AF_INET6, &((struct sockaddr_in6 *)laddr)->sin6_addr, 128, local_ip, IP_LEN);
        if (result == NULL) {
            ereport(WARNING, (errmsg("inet_net_ntop failed")));
        }
    } else if (laddr->sa_family == AF_INET) {
        result = inet_net_ntop(AF_INET, &((struct sockaddr_in *)laddr)->sin_addr, 32, local_ip, IP_LEN);
        if (result == NULL) {
            ereport(WARNING, (errmsg("inet_net_ntop failed")));
        }
    }

    if (raddr->sa_family == AF_INET6) {
        result = inet_net_ntop(AF_INET6, &((struct sockaddr_in6 *)raddr)->sin6_addr, 128, remote_ip, IP_LEN);
        if (result == NULL) {
            ereport(WARNING, (errmsg("inet_net_ntop failed")));
        }
    } else if (raddr->sa_family == AF_INET) {
        result = inet_net_ntop(AF_INET, &((struct sockaddr_in *)raddr)->sin_addr, 32, remote_ip, IP_LEN);
        if (result == NULL) {
            ereport(WARNING, (errmsg("inet_net_ntop failed")));
        }
    }

    SpinLockAcquire(&walsnd->mutex);
    rc = strncpy_s((char *)walsnd->wal_sender_channel.localhost, IP_LEN, local_ip, IP_LEN - 1);
    securec_check(rc, "\0", "\0");
    walsnd->wal_sender_channel.localhost[IP_LEN - 1] = '\0';

    if (laddr->sa_family == AF_INET6) {
        walsnd->wal_sender_channel.localport = ntohs(((struct sockaddr_in6 *)laddr)->sin6_port);
    } else if (laddr->sa_family == AF_INET) {
        walsnd->wal_sender_channel.localport = ntohs(((struct sockaddr_in *)laddr)->sin_port);
    }
    rc = strncpy_s((char *)walsnd->wal_sender_channel.remotehost, IP_LEN, remote_ip, IP_LEN - 1);
    securec_check(rc, "\0", "\0");
    walsnd->wal_sender_channel.remotehost[IP_LEN - 1] = '\0';

    if (raddr->sa_family == AF_INET6) {
        walsnd->wal_sender_channel.remoteport = ntohs(((struct sockaddr_in6 *)raddr)->sin6_port);
    } else if (raddr->sa_family == AF_INET) {
        walsnd->wal_sender_channel.remoteport = ntohs(((struct sockaddr_in *)raddr)->sin_port);
    }

    SpinLockRelease(&walsnd->mutex);

    if (IS_PGXC_DATANODE) {
        char *standby_name = (char *)(g_instance.rto_cxt.rto_standby_data[walsnd->index].id);
        rc = strncpy_s(standby_name, NODENAMELEN, u_sess->attr.attr_common.application_name,
                       strlen(u_sess->attr.attr_common.application_name));
        securec_check(rc, "\0", "\0");
    }
}

static bool UpdateHaWalSenderChannel(int ha_remote_listen_port)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    bool is_found = false;
    int i = 0;
    char* ipNoZone = NULL;
    char ipNoZoneData[IP_LEN] = {0};

    for (i = 1; i < DOUBLE_MAX_REPLNODE_NUM; i++) {
        ReplConnInfo *replconninfo = nullptr;
        if (i >= MAX_REPLNODE_NUM) {
            replconninfo = t_thrd.postmaster_cxt.CrossClusterReplConnArray[i - MAX_REPLNODE_NUM];
        } else {
            replconninfo = t_thrd.postmaster_cxt.ReplConnArray[i];
        }
        if (replconninfo == NULL)
            continue;

        /* remove any '%zone' part from an IPv6 address string */
        ipNoZone = remove_ipv6_zone(replconninfo->remotehost, ipNoZoneData, IP_LEN);

        if (strncmp((char *)ipNoZone, (char *)walsnd->wal_sender_channel.remotehost, IP_LEN) == 0 &&
            replconninfo->remoteport == ha_remote_listen_port) {
            SpinLockAcquire(&walsnd->mutex);
            walsnd->channel_get_replc = i;
            SpinLockRelease(&walsnd->mutex);
            is_found = true;
            break;
        }
    }

    if (is_found)
        ereport(LOG, (errmsg("current repl of walsender is %d.", i)));

    return is_found;
}

static void SetReplWalSender(void)
{
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    SpinLockAcquire(&walsnd->mutex);
    walsnd->replSender = true;
    SpinLockRelease(&walsnd->mutex);
}

/* Store the peer's server mode in this thread's WalSnd slot (peer_role). */
static void SetWalSndPeerMode(ServerMode mode)
{
    volatile WalSnd *mySlot = t_thrd.walsender_cxt.MyWalSnd;

    /* The field lives in shared memory, so update it under the slot's spinlock. */
    SpinLockAcquire(&mySlot->mutex);
    mySlot->peer_role = mode;
    SpinLockRelease(&mySlot->mutex);
}

/* Store the peer's database state in this thread's WalSnd slot (peer_state). */
static void SetWalSndPeerDbstate(DbState state)
{
    volatile WalSnd *mySlot = t_thrd.walsender_cxt.MyWalSnd;

    /* The field lives in shared memory, so update it under the slot's spinlock. */
    SpinLockAcquire(&mySlot->mutex);
    mySlot->peer_state = state;
    SpinLockRelease(&mySlot->mutex);
}

/*
 * Send the config file at "path" to the standby.
 *
 * The file is read with read_guc_file(), passed through comment_guc_lines()
 * with g_reserve_param, flattened into a buffer and queued as one CopyData
 * message laid out as:
 *     'm' | ConfigModifyTimeMessage (file mtime) | buffer from add_guc_optlines_to_buffer()
 *
 * Returns true when the message was queued, and also (without sending
 * anything) when AmWalSenderToDummyStandby() or AmWalSenderOnDummyStandby()
 * holds. Returns false when the file cannot be stat'ed or is empty, when the
 * file lock cannot be obtained, when reading the file raises an error, or
 * when read_guc_file() yields no lines.
 */
static bool SendConfigFile(char *path)
{
    char *buf = NULL;
    char *temp_buf = nullptr;
    char **opt_lines = nullptr;
    int len = 0;
    int temp_buf_len = 0;
    struct stat statbuf;
    ConfFileLock filelock = { NULL, 0 };
    ConfigModifyTimeMessage msgConfigTime;
    errno_t errorno = EOK;
    bool read_guc_file_success = true;

    /* Nothing is sent for these two walsender kinds; report success. */
    if (AmWalSenderToDummyStandby() || AmWalSenderOnDummyStandby())
        return true;

    /*
     * NOTE(review): this branch is also taken when lstat() succeeds but the
     * file is empty; in that case the "%m" in the message is not backed by a
     * failing call in this function.
     */
    if (lstat(path, &statbuf) < 0 || statbuf.st_size == 0) {
        ereport(LOG, (errcode_for_file_access(), errmsg("could not stat file or directory \"%s\": %m", path)));
        return false;
    }
    /**
     * Get two locks for config file before making changes, please refer to
     * AlterSystemSetConfigFile() in guc.cpp for detailed explanations.
     */
    if (get_file_lock(t_thrd.walsender_cxt.gucconf_lock_file, &filelock) != CODE_OK) {
        ereport(LOG, (errmsg("get lock failed when send gaussdb config file to the peer.")));
        return false;
    }
    LWLockAcquire(ConfigFileLock, LW_EXCLUSIVE);
    /*
     * An error raised while reading the file is caught here so that it is
     * reported and cleared, and both locks can be released below, instead of
     * propagating out of this function.
     */
    PG_TRY();
    {
    opt_lines = read_guc_file(path);
    }
    PG_CATCH();
    {
        read_guc_file_success = false;
        EmitErrorReport();
        FlushErrorState();
    }
    PG_END_TRY();
    if (!read_guc_file_success) {
        /* if failed to read guc file, will log the error info in PG_CATCH(), no need to log again. */
        release_file_lock(&filelock);
        LWLockRelease(ConfigFileLock);
        return false;
    }
    if (opt_lines == nullptr) {
        release_file_lock(&filelock);
        LWLockRelease(ConfigFileLock);
        ereport(LOG, (errmsg("the config file has no data,please check it.")));
        return false;
    }
    comment_guc_lines(opt_lines, g_reserve_param);
    temp_buf_len = add_guc_optlines_to_buffer(opt_lines, &temp_buf);
    release_opt_lines(opt_lines);
    Assert(temp_buf_len != 0);
    /* temp_buf_len including last byte '\0' */
    len = 1 + sizeof(ConfigModifyTimeMessage) + temp_buf_len;
    buf = (char *)palloc0(len);
    /* message type byte */
    buf[0] = 'm';
    /* the file's modification time, taken from the lstat() result above */
    msgConfigTime.config_modify_time = statbuf.st_mtime;
    errorno = memcpy_s(buf + 1, sizeof(ConfigModifyTimeMessage) + temp_buf_len,
                        &msgConfigTime, sizeof(ConfigModifyTimeMessage));
    securec_check(errorno, "\0", "\0");
    errorno = memcpy_s(buf + 1 + sizeof(ConfigModifyTimeMessage), temp_buf_len,
                        temp_buf, temp_buf_len);
    securec_check(errorno, "\0", "\0");
    pfree(temp_buf);
    temp_buf = NULL;
    /* The message is fully assembled; both locks are dropped before it is queued. */
    release_file_lock(&filelock);
    LWLockRelease(ConfigFileLock);
    /* Send the chunk as a CopyData message */
    (void)pq_putmessage_noblock('d', buf, len);
    pfree(buf);
    buf = NULL;
    ereport(LOG, (errmsg("walsender send config file size :%d", len)));
    return true;
}

/*
 * Alarm checker driven by the WalSegmemtRemovedhappened flag.
 *
 * When the flag is set, the alarm's additional info is filled in as a fault
 * (ALM_AT_Fault) and ALM_ACR_Abnormal is returned; otherwise it is filled in
 * as a resume (ALM_AT_Resume) and ALM_ACR_Normal is returned.
 */
AlarmCheckResult WalSegmentsRemovedChecker(Alarm *alarm, AlarmAdditionalParam *additionalParam)
{
    if (WalSegmemtRemovedhappened != true) {
        /* No removal recorded: fill the alarm message as a resume. */
        WriteAlarmAdditionalInfo(additionalParam, g_instance.attr.attr_common.PGXCNodeName, "", "", alarm,
                                 ALM_AT_Resume);
        return ALM_ACR_Normal;
    }

    /* A removal was recorded: fill the alarm message as a fault. */
    WriteAlarmAdditionalInfo(additionalParam, g_instance.attr.attr_common.PGXCNodeName, "", "", alarm, ALM_AT_Fault,
                             g_instance.attr.attr_common.PGXCNodeName);
    return ALM_ACR_Abnormal;
}

void StopAliveBuildSender(void)
{
    for (int i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];
        SndRole sndrole;

        if (walsnd->pid == 0 || t_thrd.walsender_cxt.MyWalSnd == walsnd)
            continue;

        SpinLockAcquire(&walsnd->mutex);
        sndrole = walsnd->sendRole;
        SpinLockRelease(&walsnd->mutex);

        /* skip the last cycle using SIGTERM */
        if (sndrole == SNDROLE_PRIMARY_BUILDSTANDBY)
            (void)gs_signal_send(walsnd->pid, SIGTERM);
    }
}

bool IsAllBuildSenderExit()
{
    for (int i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];
        SndRole sndrole;
        SpinLockAcquire(&walsnd->mutex);
        sndrole = walsnd->sendRole;
        SpinLockRelease(&walsnd->mutex);
        if (sndrole == SNDROLE_PRIMARY_BUILDSTANDBY && walsnd->pid != 0) {
            return false;
        }
    }
    ereport(LOG, (errmsg("all build walsenders exited")));
    return true;
}

void GetFastestReplayStandByServiceAddress(char *fastest_remote_address, char *second_fastest_remote_address,
                                           size_t address_len)
{
    if (fastest_remote_address == NULL || second_fastest_remote_address == NULL || address_len == 0 ||
        t_thrd.walsender_cxt.WalSndCtl == NULL)
        return;

    int fastest = 0;
    int second_fastest = 0;
    XLogRecPtr fastest_replay = InvalidXLogRecPtr;
    XLogRecPtr second_fastest_replay = InvalidXLogRecPtr;

    errno_t rc = EOK;

    for (int i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        if (walsnd->pid == 0 || !walsnd->replSender)
            continue;

        SpinLockAcquire(&walsnd->mutex);
        XLogRecPtr walsnd_replay = walsnd->apply;
        DbState peer_state = walsnd->peer_state;
        SpinLockRelease(&walsnd->mutex);

        /* remote can accept connections */
        if (peer_state != NORMAL_STATE && peer_state != CATCHUP_STATE)
            continue;

        if (XLByteLT(second_fastest_replay, walsnd_replay)) {
            if (XLByteLT(fastest_replay, walsnd_replay)) {
                /* walsnd_replay is larger than fastest_replay */
                second_fastest = fastest;
                second_fastest_replay = fastest_replay;

                fastest = i;
                fastest_replay = walsnd_replay;
            } else {
                /* walsnd_replay is in the range (second_fastest_replay, fastest_replay] */
                second_fastest = i;
                second_fastest_replay = walsnd_replay;
            }
        }
    }

    /* find fastest replay standby */
    if (!XLogRecPtrIsInvalid(fastest_replay)) {
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[fastest];
        SpinLockAcquire(&walsnd->mutex);
        rc = snprintf_s(fastest_remote_address, address_len, (address_len - 1), "%s@%d",
                        walsnd->wal_sender_channel.remotehost, walsnd->wal_sender_channel.remoteport);
        SpinLockRelease(&walsnd->mutex);

        securec_check_ss(rc, "", "");
    }

    /* find second fastest replay standby */
    if (!XLogRecPtrIsInvalid(second_fastest_replay)) {
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[second_fastest];
        SpinLockAcquire(&walsnd->mutex);
        rc = snprintf_s(second_fastest_remote_address, address_len, (address_len - 1), "%s@%d",
                        walsnd->wal_sender_channel.remotehost, walsnd->wal_sender_channel.remoteport);
        SpinLockRelease(&walsnd->mutex);

        securec_check_ss(rc, "", "");
    }
}

bool IsPrimaryStandByReadyToRemoteRead(void)
{
    /* only using  IS_DN_DUMMY_STANDYS_MODE && PRIMARY_MODE */
    bool can_remte_read = false;

    for (int i = 0; i < g_instance.attr.attr_storage.max_wal_senders; i++) {
        /* use volatile pointer to prevent code rearrangement */
        volatile WalSnd *walsnd = &t_thrd.walsender_cxt.WalSndCtl->walsnds[i];

        if (walsnd->pid == 0 || t_thrd.walsender_cxt.MyWalSnd == walsnd)
            continue;

        SpinLockAcquire(&walsnd->mutex);
        SndRole sndrole = walsnd->sendRole;
        DbState peer_state = walsnd->peer_state;
        SpinLockRelease(&walsnd->mutex);

        if (sndrole == SNDROLE_PRIMARY_STANDBY) {
            if (peer_state == NORMAL_STATE || peer_state == CATCHUP_STATE) {
                can_remte_read = true;
            }

            break;
        }
    }

    return can_remte_read;
}

static bool IsWalSenderToBuild(void)
{
    WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    bool isWalToBuild = false;
    if (walsnd == NULL) {
        return false;
    }
    SpinLockAcquire(&walsnd->mutex);
    SndRole sndrole = walsnd->sendRole;
    ThreadId pid = walsnd->pid;
    if (sndrole == SNDROLE_PRIMARY_BUILDSTANDBY && pid != 0) {
        isWalToBuild = true;
    }
    SpinLockRelease(&walsnd->mutex);

    return isWalToBuild;
}

/*
 * Store startLsn into syncPercentCountStart of the current walsender slot,
 * under the slot's spinlock.
 *
 * Only called in walsender: MyWalSnd is dereferenced without a NULL check.
 */
static void WalSndSetPercentCountStartLsn(XLogRecPtr startLsn)
{
    /* volatile pointer keeps the compiler from rearranging the accesses */
    volatile WalSnd *self = t_thrd.walsender_cxt.MyWalSnd;

    SpinLockAcquire(&self->mutex);
    self->syncPercentCountStart = startLsn;
    SpinLockRelease(&self->mutex);
}

/*
 * Refresh syncPercentCountStart of the current walsender slot.
 *
 * The window is WalGetSyncCountWindow() segments of XLogSegSize bytes.
 *  - No slot, or slot in WALSNDSTATE_CATCHUP: nothing is changed.
 *  - currentMaxLsn - currentDoneLsn below the window: the start LSN is
 *    reset to InvalidXLogRecPtr.
 *  - Otherwise: the start LSN is set to currentDoneLsn, but only if it is
 *    currently InvalidXLogRecPtr.
 */
static void WalSndRefreshPercentCountStartLsn(XLogRecPtr currentMaxLsn, XLogRecPtr currentDoneLsn)
{
    uint64 windowBytes = ((uint64)WalGetSyncCountWindow() * XLogSegSize);
    volatile WalSnd *self = t_thrd.walsender_cxt.MyWalSnd;

    /* no slot, or still catching up: don't refresh */
    if (!self || self->state == WALSNDSTATE_CATCHUP) {
        return;
    }

    if (XLogDiff(currentMaxLsn, currentDoneLsn) >= windowBytes) {
        XLogRecPtr recordedStart = InvalidXLogRecPtr;

        SpinLockAcquire(&self->mutex);
        recordedStart = self->syncPercentCountStart;
        SpinLockRelease(&self->mutex);

        /* keep an already recorded start point */
        if (XLByteEQ(recordedStart, InvalidXLogRecPtr)) {
            WalSndSetPercentCountStartLsn(currentDoneLsn);
        }
        return;
    }

    /* lag is inside the window: clear the start point */
    WalSndSetPercentCountStartLsn(InvalidXLogRecPtr);
}

/*
 * Return the sync count window as a number of WAL segments: the result of
 * XLogSegmentsNum applied to the session's wal_keep_segments setting,
 * narrowed to uint32 and widened to XLogSegNo.
 */
XLogSegNo WalGetSyncCountWindow(void)
{
    uint32 windowSegments = (uint32)XLogSegmentsNum(u_sess->attr.attr_storage.wal_keep_segments);

    return (XLogSegNo)windowSegments;
}

/*
 * Append archive_task_status_idx to the archive task list of walsnd and
 * bump its task counter, both under mutex_archive_task_list.
 *
 * A NULL walsnd trips an assertion (in assert-enabled builds) and is
 * otherwise ignored.
 */
void add_archive_task_to_list(int archive_task_status_idx, WalSnd *walsnd)
{
    if (walsnd != NULL) {
        SpinLockAcquire(&walsnd->mutex_archive_task_list);
        walsnd->archive_task_list = lappend_int(walsnd->archive_task_list, archive_task_status_idx);
        walsnd->archive_task_count++;
        SpinLockRelease(&walsnd->mutex_archive_task_list);
        return;
    }

    /* callers are not expected to pass a NULL slot */
    Assert(0);
}

/*
 * Pop the first entry of the current walsender's archive task list.
 *
 * Returns a pointer to the archive_task stored in
 * g_instance.archive_obs_cxt.archive_status at the popped index, or NULL
 * when the task counter is zero. List and counter are updated under
 * mutex_archive_task_list. MyWalSnd is dereferenced without a NULL check.
 */
ArchiveXlogMessage* get_archive_task_from_list()
{
    volatile WalSnd *self = t_thrd.walsender_cxt.MyWalSnd;
    ArchiveXlogMessage *task = NULL;

    SpinLockAcquire(&self->mutex_archive_task_list);
    if (self->archive_task_count != 0) {
        /* the list stores indexes into the shared archive_status array */
        int statusIdx = lfirst_int(list_head(self->archive_task_list));

        task = &g_instance.archive_obs_cxt.archive_status[statusIdx].archive_task;
        self->archive_task_list = list_delete_first(self->archive_task_list);
        self->archive_task_count--;
    }
    SpinLockRelease(&self->mutex_archive_task_list);

    return task;
}

/*
 * Calculate catchup rate of standby to estimate how long
 * the standby will be caught up with primary.
 */
static void CalCatchupRate()
{
    /* calculate catchup late every 1000ms */
    int calculateCatchupRateTime = 1000;
    if (u_sess->attr.attr_storage.catchup2normal_wait_time < 0) {
        return;
    }
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    SpinLockAcquire(&walsnd->mutex);
    XLogRecPtr write = walsnd->write;
    TimestampTz now = GetCurrentTimestamp();

    if (XLByteEQ(walsnd->lastCalWrite, InvalidXLogRecPtr)) {
        walsnd->lastCalWrite = write;
        walsnd->lastCalTime = now;
        SpinLockRelease(&walsnd->mutex);
        return;
    }
    if (TimestampDifferenceExceeds(walsnd->lastCalTime, now, calculateCatchupRateTime) &&
        XLByteLT(walsnd->lastCalWrite, write)) {
        double tempRate = ((double)(now - walsnd->lastCalTime)) /
                          ((double)(XLByteDifference(write, walsnd->lastCalWrite)));
        walsnd->catchupRate = (walsnd->catchupRate == 0) ? tempRate : ((walsnd->catchupRate + tempRate) / 2);
        walsnd->lastCalWrite = write;
        walsnd->lastCalTime = now;
    }
    SpinLockRelease(&walsnd->mutex);
}

#define STREAMING_DR_REQUEST_SEND_INTERVAL 2500
static void WalSndHadrSwitchoverRequest()
{
    HadrSwitchoverMessage hadrSwithoverMessage;
    errno_t errorno = EOK;
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    TimestampTz lastRequestTimestamp = walsnd->lastRequestTimestamp;
    int interval = ComputeTimeStamp(lastRequestTimestamp);

    /* Send a request in 5 second */
    if (interval < STREAMING_DR_REQUEST_SEND_INTERVAL) {
        return;
    }

    walsnd->lastRequestTimestamp = GetCurrentTimestamp();
    /* Construct a new message */
    hadrSwithoverMessage.switchoverBarrierLsn = g_instance.streaming_dr_cxt.switchoverBarrierLsn;
    hadrSwithoverMessage.isMasterInstanceReady = walsnd->isMasterInstanceReady;

    /* Prepend with the message type and send it. */
    t_thrd.walsender_cxt.output_xlog_message[0] = 'S';
    errorno = memcpy_s(t_thrd.walsender_cxt.output_xlog_message + 1,
                       sizeof(WalDataMessageHeader) + g_instance.attr.attr_storage.MaxSendSize * 1024,
                       &hadrSwithoverMessage, sizeof(HadrSwitchoverMessage));
    securec_check(errorno, "\0", "\0");
    (void)pq_putmessage_noblock('d', t_thrd.walsender_cxt.output_xlog_message,
        sizeof(HadrSwitchoverMessage) + 1);

    if (walsnd->isMasterInstanceReady) {
        SpinLockAcquire(&walsnd->mutex);
        if (walsnd->interactiveState == SDRS_MASTER_INSTANCE_READY) {
            walsnd->interactiveState = SDRS_INTERACTION_COMPLETE;
            g_instance.streaming_dr_cxt.interactionCompletedNum++;
        }
        SpinLockRelease(&walsnd->mutex);
        ereport(LOG, (errmsg("master instance is ready in streaming dr switchover. "
            "interactiveState %d", (int32)(walsnd->interactiveState))));
    } else {
        ereport(LOG, (errmsg("sending streaming dr switchover request. "
            "interactiveState %d", (int32)(walsnd->interactiveState))));
    }
}

static void ProcessHadrSwitchoverMessage()
{
    HadrSwitchoverMessage hadrSwithoverMessage;
    XLogRecPtr switchoverBarrierLsn;
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;
    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char*)&hadrSwithoverMessage,
        sizeof(HadrSwitchoverMessage));

    switchoverBarrierLsn = hadrSwithoverMessage.switchoverBarrierLsn;

    /* Whether the interaction between the main cluster and the disaster recovery cluster is completed */
    if (g_instance.streaming_dr_cxt.switchoverBarrierLsn != InvalidXLogRecPtr &&
        XLByteEQ(g_instance.streaming_dr_cxt.switchoverBarrierLsn, switchoverBarrierLsn) &&
        XLByteEQ(g_instance.streaming_dr_cxt.switchoverBarrierLsn, walsnd->flush)) {
        SpinLockAcquire(&walsnd->mutex);
        if (walsnd->interactiveState == SDRS_INTERACTION_BEGIN) {
            walsnd->interactiveState = SDRS_MASTER_INSTANCE_READY;
            walsnd->isMasterInstanceReady = true;
        }
        SpinLockRelease(&walsnd->mutex);
    }

    ereport(LOG,
        (errmsg("ProcessHadrSwitchoverMessage: target switchover barrier lsn  %X/%X, "
            "receive switchover barrier lsn %X/%X, the hadr receiver flush Lsn is %X/%X, "
            "interactiveState %d, isMasterInstanceReady %d",
            (uint32)(g_instance.streaming_dr_cxt.switchoverBarrierLsn >> 32),
            (uint32)(g_instance.streaming_dr_cxt.switchoverBarrierLsn),
            (uint32)(switchoverBarrierLsn >> 32), (uint32)(switchoverBarrierLsn),
            (uint32)(walsnd->flush >> 32), (uint32)(walsnd->flush),
            (int32)(walsnd->interactiveState), walsnd->isMasterInstanceReady)));
}

static void ProcessHadrReplyMessage()
{
    HadrReplyMessage hadrReply;
    pq_copymsgbytes(t_thrd.walsender_cxt.reply_message, (char*)&hadrReply, sizeof(HadrReplyMessage));
    SpinLockAcquire(&g_instance.streaming_dr_cxt.mutex);
    if (BARRIER_LT((char *)g_instance.streaming_dr_cxt.targetBarrierId, (char *)hadrReply.targetBarrierId)) {
        int rc = strncpy_s((char *)g_instance.streaming_dr_cxt.targetBarrierId, MAX_BARRIER_ID_LENGTH,
            hadrReply.targetBarrierId, MAX_BARRIER_ID_LENGTH - 1);
        securec_check(rc, "\0", "\0");
    }
    SpinLockRelease(&g_instance.streaming_dr_cxt.mutex);
}

static int WalSndTimeout()
{
    const int MULTIPLE_TIME = 4;
    volatile WalSnd *walsnd = t_thrd.walsender_cxt.MyWalSnd;

    if (t_thrd.role == WAL_DB_SENDER || t_thrd.role == LOGICAL_READ_RECORD || t_thrd.role == PARALLEL_DECODE) {
        return u_sess->attr.attr_storage.logical_sender_timeout;
    } else if (walsnd == NULL) {
        /* DataSender -> IdentifyMode */
        return u_sess->attr.attr_storage.wal_sender_timeout;
    } else if (walsnd->sendRole == SNDROLE_PRIMARY_BUILDSTANDBY) {
        return MULTIPLE_TIME * t_thrd.walsender_cxt.timeoutCheckInternal;
    } else {
        return t_thrd.walsender_cxt.timeoutCheckInternal;
    }
}