From: Christopher Faulet Date: Mon, 29 Sep 2025 13:48:18 +0000 (+0200) Subject: MAJOR: peers: Stop to track acked updates per shared table X-Git-Url: http://git.ipfire.org/gitweb.cgi?a=commitdiff_plain;h=4e181a2c26ed3254ed1b7bc4bef1135cbc55ec4a;p=thirdparty%2Fhaproxy.git MAJOR: peers: Stop to track acked updates per shared table This patch is quite small but the change is really important. Thanks to the previous patch, we can use the PEER_F_SYNCHED flag to know whether a peer is synchronized or not. So instead of tracking the last ack message for each table to be able to restart at a given point when the peer reconnects, we decided to restart from the beginning if a peer is not synchronized when a new connection is established. So, it is a huge change because, on reconnect, instead of pushing only some missed updates, all local updates are pushed again. Most of the time, it is not a problem because nowadays connections are quite stable, especially because a heartbeat message is sent to keep them active. The only drawback is when a peer is restarted. In that case, we have no way to know it is synchronized because it learned the table contents from its old local peer. This change is mandatory: first to replace the update tree by an mt-list and remove the update lock, then to split this list by buckets to reduce contention. 
--- diff --git a/include/haproxy/peers-t.h b/include/haproxy/peers-t.h index ee48d73da..439e9ce0e 100644 --- a/include/haproxy/peers-t.h +++ b/include/haproxy/peers-t.h @@ -143,7 +143,6 @@ struct shared_table { unsigned int last_pushed; unsigned int last_get; unsigned int teaching_origin; - unsigned int update; struct shared_table *next; /* next shared table in list */ }; diff --git a/src/peers.c b/src/peers.c index 30783f9f8..7d955008f 100644 --- a/src/peers.c +++ b/src/peers.c @@ -2212,7 +2212,6 @@ static inline int peer_treat_ackmsg(struct appctx *appctx, struct peer *p, /* ack message */ uint32_t table_id ; uint32_t update; - struct shared_table *st; int ret = 1; TRACE_ENTER(PEERS_EV_SESS_IO|PEERS_EV_RX_MSG|PEERS_EV_PROTO_ACK, appctx, p); @@ -2233,19 +2232,13 @@ static inline int peer_treat_ackmsg(struct appctx *appctx, struct peer *p, memcpy(&update, *msg_cur, sizeof(update)); update = ntohl(update); - for (st = p->tables; st; st = st->next) { - if (st->local_id == table_id) { - st->update = update; - break; - } - } if (table_id == p->last.table->local_id && update == p->last.id) { TRACE_STATE("Peer synched again", PEERS_EV_SESS_IO|PEERS_EV_RX_MSG|PEERS_EV_PROTO_ACK, appctx, p); p->flags |= PEER_F_SYNCHED; } end: - TRACE_LEAVE(PEERS_EV_SESS_IO|PEERS_EV_RX_MSG|PEERS_EV_PROTO_ACK, appctx, p, st); + TRACE_LEAVE(PEERS_EV_SESS_IO|PEERS_EV_RX_MSG|PEERS_EV_PROTO_ACK, appctx, p); return ret; } @@ -2582,7 +2575,7 @@ static inline int peer_treat_awaited_msg(struct appctx *appctx, struct peer *pee TRACE_PROTO("Resync request message received", PEERS_EV_SESS_IO|PEERS_EV_RX_MSG|PEERS_EV_PROTO_CTRL, appctx, peer); /* prepare tables for a global push */ for (st = peer->tables; st; st = st->next) { - st->teaching_origin = st->last_pushed = st->update; + st->teaching_origin = st->last_pushed; st->flags = 0; } @@ -2627,7 +2620,7 @@ static inline int peer_treat_awaited_msg(struct appctx *appctx, struct peer *pee } peer->flags |= PEER_F_SYNCHED; for (st = peer->tables; st; st = 
st->next) { - st->update = st->last_pushed = st->teaching_origin; + st->last_pushed = st->teaching_origin; st->flags = 0; } @@ -2962,21 +2955,22 @@ static inline void init_connected_peer(struct peer *peer, struct peers *peers) /* Init cursors */ for (st = peer->tables; st ; st = st->next) { st->last_get = st->last_acked = 0; + HA_RWLOCK_WRLOCK(STK_TABLE_UPDT_LOCK, &st->table->updt_lock); - /* if st->update appears to be in future it means - * that the last acked value is very old and we + /* if st->last_pushed appears to be in future it means + * that the last update is very old and we * remain unconnected a too long time to use this * acknowledgement as a reset. * We should update the protocol to be able to * signal the remote peer that it needs a full resync. - * Here a partial fix consist to set st->update at + * Here a partial fix consist to set st->last_pushed at * the max past value. */ - if (!(peer->flags & PEER_F_SYNCHED) || (int)(st->table->localupdate - st->update) < 0) { - st->update = st->table->localupdate + (2147483648U); + if (!(peer->flags & PEER_F_SYNCHED) || (int)(st->table->localupdate - st->last_pushed) < 0) { + st->last_pushed = st->table->localupdate + (2147483648U); peer->flags &= ~PEER_F_SYNCHED; } - st->teaching_origin = st->last_pushed = st->update; + st->teaching_origin = st->last_pushed; st->flags = 0; HA_RWLOCK_WRUNLOCK(STK_TABLE_UPDT_LOCK, &st->table->updt_lock); @@ -4318,8 +4312,8 @@ static int peers_dump_peer(struct buffer *msg, struct appctx *appctx, struct pee st, st->local_id, st->remote_id, st->flags, (unsigned long long)st->remote_data); chunk_appendf(&trash, "\n last_acked=%u last_pushed=%u last_get=%u" - " teaching_origin=%u update=%u", - st->last_acked, st->last_pushed, st->last_get, st->teaching_origin, st->update); + " teaching_origin=%u", + st->last_acked, st->last_pushed, st->last_get, st->teaching_origin); chunk_appendf(&trash, "\n table:%p id=%s update=%u localupdate=%u refcnt=%u", t, t->id, t->update, t->localupdate, 
t->refcnt); if (flags & PEERS_SHOW_F_DICT) {