Line data Source code
1 : /*
2 : * Copyright (c) 2013 Juniper Networks, Inc. All rights reserved.
3 : */
4 :
5 : #include "bgp/peer_close_manager.h"
6 :
7 :
8 : #include <list>
9 : #include <map>
10 :
11 : #include <boost/foreach.hpp>
12 :
13 : #include "base/task_annotations.h"
14 : #include "bgp/bgp_log.h"
15 : #include "bgp/bgp_membership.h"
16 : #include "bgp/bgp_peer_types.h"
17 : #include "bgp/bgp_route.h"
18 : #include "bgp/bgp_server.h"
19 : #include "bgp/routing-instance/routing_instance.h"
20 : #include "net/community_type.h"
21 :
22 : #define PEER_CLOSE_MANAGER_LOG(msg) \
23 : BGP_LOG_PEER(Event, peer_close_->peer(), SandeshLevel::SYS_INFO, \
24 : BGP_LOG_FLAG_ALL, BGP_PEER_DIR_NA, \
25 : "PeerCloseManager: State " << GetStateName(state_) << \
26 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
27 : ", MembershipReqPending: " << membership_req_pending_ << \
28 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
29 :
30 : #define PEER_CLOSE_MANAGER_TABLE_LOG(msg) \
31 : BGP_LOG_PEER_TABLE(peer_close_->peer(), SandeshLevel::SYS_INFO, \
32 : BGP_LOG_FLAG_ALL, table, \
33 : "PeerCloseManager: State " << GetStateName(state_) << \
34 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
35 : ", MembershipReqPending: " << membership_req_pending_ << \
36 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
37 :
38 : #define MOVE_TO_STATE(state) \
39 : do { \
40 : assert(state_ != state); \
41 : PEER_CLOSE_MANAGER_LOG("Move to state " << GetStateName(state)); \
42 : state_ = state; \
43 : } while (false)
44 :
45 : // Create an instance of PeerCloseManager with back reference to parent IPeer
46 8064 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close,
47 8064 : boost::asio::io_context *io_service) :
48 8064 : peer_close_(peer_close), gr_timer_(NULL),
49 16128 : event_queue_(new WorkQueue<Event *>(
50 24192 : TaskScheduler::GetInstance()->GetTaskId(
51 8064 : peer_close_->GetTaskName()),
52 8064 : peer_close_->GetTaskInstance(),
53 8064 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
54 8064 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
55 16128 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
56 8064 : stats_.init++;
57 8064 : membership_req_pending_ = 0;
58 8064 : gr_timer_ = TimerManager::CreateTimer(*io_service,
59 : "Graceful Restart Timer");
60 8064 : }
61 :
62 : // Create an instance of PeerCloseManager with back reference to parent IPeer
63 20409 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close) :
64 20409 : peer_close_(peer_close), gr_timer_(NULL),
65 40820 : event_queue_(new WorkQueue<Event *>(
66 61229 : TaskScheduler::GetInstance()->GetTaskId(
67 20409 : peer_close_->GetTaskName()),
68 20410 : peer_close_->GetTaskInstance(),
69 20410 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
70 20410 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
71 40819 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
72 20410 : stats_.init++;
73 20410 : membership_req_pending_ = 0;
74 20410 : if (peer_close->peer() && peer_close->peer()->server()) {
75 16595 : gr_timer_ =
76 16595 : TimerManager::CreateTimer(*peer_close->peer()->server()->ioservice(),
77 : "Graceful Restart Timer");
78 : }
79 20410 : }
80 :
81 45865 : PeerCloseManager::~PeerCloseManager() {
82 28474 : event_queue_->Shutdown();
83 28474 : TimerManager::DeleteTimer(gr_timer_);
84 45865 : }
85 :
86 225919 : std::string PeerCloseManager::GetStateName(State state) const {
87 225919 : switch (state) {
88 32562 : case NONE:
89 32562 : return "NONE";
90 68471 : case GR_TIMER:
91 68471 : return "GR_TIMER";
92 19452 : case STALE:
93 19452 : return "STALE";
94 5908 : case LLGR_STALE:
95 5908 : return "LLGR_STALE";
96 6508 : case LLGR_TIMER:
97 6508 : return "LLGR_TIMER";
98 10762 : case SWEEP:
99 10762 : return "SWEEP";
100 82256 : case DELETE:
101 82256 : return "DELETE";
102 : }
103 0 : assert(false);
104 : return "";
105 : }
106 :
107 203835 : std::string PeerCloseManager::GetMembershipStateName(
108 : MembershipState state) const {
109 203835 : switch (state) {
110 91326 : case MEMBERSHIP_NONE:
111 91326 : return "NONE";
112 108148 : case MEMBERSHIP_IN_USE:
113 108148 : return "IN_USE";
114 4361 : case MEMBERSHIP_IN_WAIT:
115 4361 : return "IN_WAIT";
116 : }
117 0 : assert(false);
118 : return "";
119 : }
120 :
121 53961 : std::string PeerCloseManager::GetEventName(EventType eventType) const {
122 53961 : switch (eventType) {
123 0 : case EVENT_NONE:
124 0 : return "NONE";
125 10164 : case CLOSE:
126 10164 : return "CLOSE";
127 5559 : case EOR_RECEIVED:
128 5559 : return "EOR_RECEIVED";
129 9690 : case MEMBERSHIP_REQUEST:
130 9690 : return "MEMBERSHIP_REQUEST";
131 25718 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
132 25718 : return "MEMBERSHIP_REQUEST_COMPLETE_CALLBACK";
133 2830 : case TIMER_CALLBACK:
134 2830 : return "TIMER_CALLBACK";
135 : }
136 :
137 0 : return "";
138 : }
139 :
140 143426 : void PeerCloseManager::EnqueueEvent(Event *event) {
141 163950 : PEER_CLOSE_MANAGER_LOG("Enqueued event " <<
142 : GetEventName(event->event_type) <<
143 : ", graceful " << event->graceful <<
144 : ", family " << Address::FamilyToString(event->family));
145 143476 : event_queue_->Enqueue(event);
146 143642 : }
147 :
148 : // Trigger closure of an IPeer
149 : //
150 : // Graceful close_state_: NONE
151 : // RibIn Stale Marking and Ribout deletion close_state_: STALE
152 : // StateMachine restart and GR timer start close_state_: GR_TIMER
153 : //
154 : // Peer IsReady() in GR timer callback (or via reception of all EoRs)
155 : // RibIn Sweep and Ribout Generation close_state_: SWEEP
156 : // MembershipRequestCallback close_state_: NONE
157 : //
158 : // Peer not IsReady() in GR timer callback
159 : // If LLGR supported close_state_: LLGR_STALE
160 : // RibIn Stale marking with LLGR_STALE community close_state_: LLGR_TIMER
161 : //
162 : // Peer not IsReady() in LLGR timer callback
163 : // RibIn Delete close_state_: DELETE
164 : // MembershipRequestCallback close_state_: NONE
165 : //
166 : // Peer IsReady() in LLGR timer callback (or via reception of all EoRs)
167 : // RibIn Sweep close_state_: SWEEP
168 : // MembershipRequestCallback close_state_: NONE
169 : //
170 : // If LLGR is not supported
171 : // RibIn Delete close_state_: DELETE
172 : // MembershipRequestCallback close_state_: NONE
173 : //
174 : // Close() call during any state other than NONE and DELETE
175 : // Cancel GR timer and restart GR Closure all over again
176 : //
177 : // NonGraceful close_state_ = * (except DELETE)
178 : // A. RibIn deletion and Ribout deletion close_state_ = DELETE
179 : // B. MembershipRequestCallback => Peers delete/StateMachine restart
180 : // close_state_ = NONE
181 : //
182 : // If Close is restarted, account for GR timer's elapsed time.
183 : //
184 : // Use graceful as true to close gracefully.
185 20943 : void PeerCloseManager::Close(bool graceful) {
186 20943 : EnqueueEvent(new Event(CLOSE, graceful));
187 20946 : }
188 :
189 20946 : void PeerCloseManager::Close(Event *event) {
190 : // Note down non-graceful close trigger. Once non-graceful closure is
191 : // triggered, it should remain so until close process is complete. Further
192 : // graceful closure calls until then should remain non-graceful.
193 20946 : graceful_ &= event->graceful;
194 20946 : CloseInternal();
195 20946 : }
196 :
197 21479 : void PeerCloseManager::CloseInternal() {
198 21479 : stats_.close++;
199 :
200 : // Ignore nested closures
201 21479 : if (close_again_) {
202 4 : PEER_CLOSE_MANAGER_LOG("Nested close calls ignored");
203 4 : return;
204 : }
205 :
206 21475 : switch (state_) {
207 19931 : case NONE:
208 19931 : stats_.ResetRouteStats();
209 19931 : ProcessClosure();
210 19931 : break;
211 :
212 337 : case GR_TIMER:
213 463 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart GR");
214 337 : close_again_ = true;
215 337 : stats_.nested++;
216 337 : gr_elapsed_ += gr_timer_->GetElapsedTime();
217 337 : CloseComplete();
218 337 : break;
219 :
220 196 : case LLGR_TIMER:
221 196 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart LLGR");
222 196 : close_again_ = true;
223 196 : stats_.nested++;
224 196 : llgr_elapsed_ += gr_timer_->GetElapsedTime();
225 196 : CloseComplete();
226 196 : break;
227 :
228 1011 : case STALE:
229 : case LLGR_STALE:
230 : case SWEEP:
231 : case DELETE:
232 1011 : PEER_CLOSE_MANAGER_LOG("Nested close");
233 1011 : close_again_ = true;
234 1011 : stats_.nested++;
235 1011 : break;
236 : }
237 : }
238 :
239 14822 : void PeerCloseManager::ProcessEORMarkerReceived(Address::Family family) {
240 14822 : EnqueueEvent(new Event(EOR_RECEIVED, family));
241 14824 : }
242 :
243 14824 : void PeerCloseManager::ProcessEORMarkerReceived(Event *event) {
244 14824 : if ((state_ == GR_TIMER || state_ == LLGR_TIMER) && !families_.empty()) {
245 1842 : if (event->family == Address::UNSPEC) {
246 40 : families_.clear();
247 : } else {
248 1802 : families_.erase(event->family);
249 : }
250 :
251 : // Start the timer if all EORs have been received.
252 1842 : if (families_.empty())
253 1227 : StartRestartTimer(0);
254 : }
255 14824 : }
256 :
257 : // Process RibIn during peer closure.
258 2684 : void PeerCloseManager::StartRestartTimer(int time) {
259 2684 : gr_timer_->Cancel();
260 2948 : PEER_CLOSE_MANAGER_LOG("GR Timer started to fire after " << time/1000 <<
261 : " seconds");
262 2684 : gr_timer_->Start(time,
263 : boost::bind(&PeerCloseManager::RestartTimerCallback, this));
264 2684 : }
265 :
266 2834 : bool PeerCloseManager::RestartTimerCallback() {
267 2834 : CHECK_CONCURRENCY("timer::TimerTask");
268 2834 : EnqueueEvent(new Event(TIMER_CALLBACK));
269 2834 : return false;
270 : }
271 :
272 2834 : void PeerCloseManager::RestartTimerCallback(Event *event) {
273 2834 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
274 :
275 2944 : PEER_CLOSE_MANAGER_LOG("GR Timer callback started");
276 2834 : if (state_ != GR_TIMER && state_ != LLGR_TIMER)
277 960 : return;
278 :
279 1874 : if (peer_close_->IsReady() && !families_.empty()) {
280 : // Fake reception of all EORs.
281 204 : for (IPeerClose::Families::iterator i = families_.begin(), next = i;
282 408 : i != families_.end(); i = next) {
283 204 : next++;
284 216 : PEER_CLOSE_MANAGER_LOG("Simulate EoR reception for family " << *i);
285 204 : peer_close_->ReceiveEndOfRIB(*i);
286 : }
287 : } else {
288 1670 : ProcessClosure();
289 : }
290 : }
291 :
292 : // Route stale timer callback. If the peer has come back up, sweep routes for
293 : // those address families that are still active. Delete the rest
294 21601 : void PeerCloseManager::ProcessClosure() {
295 : // If the peer is back up and this address family is still supported,
296 : // sweep old paths which may not have come back in the new session
297 21601 : switch (state_) {
298 19931 : case NONE:
299 19931 : if (!graceful_ || !peer_close_->IsCloseGraceful()) {
300 19702 : MOVE_TO_STATE(DELETE);
301 18903 : stats_.deletes++;
302 : } else {
303 1223 : MOVE_TO_STATE(STALE);
304 1028 : stats_.stale++;
305 1028 : StaleNotify();
306 1028 : return;
307 : }
308 18903 : break;
309 1107 : case GR_TIMER:
310 1107 : if (peer_close_->IsReady()) {
311 745 : MOVE_TO_STATE(SWEEP);
312 705 : gr_elapsed_ = 0;
313 705 : llgr_elapsed_ = 0;
314 705 : stats_.sweep++;
315 705 : break;
316 : }
317 402 : if (peer_close_->IsCloseLongLivedGraceful()) {
318 311 : MOVE_TO_STATE(LLGR_STALE);
319 282 : stats_.llgr_stale++;
320 282 : peer_close_->LongLivedGracefulRestartStale();
321 282 : break;
322 : }
323 120 : MOVE_TO_STATE(DELETE);
324 120 : stats_.deletes++;
325 120 : break;
326 :
327 563 : case LLGR_TIMER:
328 563 : if (peer_close_->IsReady()) {
329 319 : MOVE_TO_STATE(SWEEP);
330 319 : gr_elapsed_ = 0;
331 319 : llgr_elapsed_ = 0;
332 319 : stats_.sweep++;
333 319 : break;
334 : }
335 273 : MOVE_TO_STATE(DELETE);
336 244 : stats_.deletes++;
337 244 : break;
338 :
339 0 : case STALE:
340 : case LLGR_STALE:
341 : case SWEEP:
342 : case DELETE:
343 0 : assert(false);
344 : return;
345 : }
346 :
347 20573 : if (state_ == DELETE)
348 19267 : peer_close_->CustomClose();
349 20573 : MembershipRequest();
350 : }
351 :
352 1375 : void PeerCloseManager::CloseComplete() {
353 1541 : MOVE_TO_STATE(NONE);
354 1375 : gr_timer_->Cancel();
355 1375 : families_.clear();
356 1375 : stats_.init++;
357 :
358 : // Nested closures trigger fresh GR
359 1375 : if (close_again_) {
360 533 : close_again_ = false;
361 533 : CloseInternal();
362 : }
363 1375 : }
364 :
365 1418 : bool PeerCloseManager::AssertSweepState(bool do_assert) {
366 1418 : bool check = (state_ == SWEEP);
367 1418 : if (do_assert)
368 650 : assert(check);
369 1418 : return check;
370 : }
371 :
372 95239 : bool PeerCloseManager::AssertMembershipManagerInUse(bool do_assert) {
373 95239 : bool check = false;
374 181710 : check |= (state_ == STALE || state_ == LLGR_STALE || state_ == SWEEP ||
375 86471 : state_ == DELETE);
376 95239 : check |= (membership_state_ == MEMBERSHIP_IN_USE);
377 95239 : check |= (membership_req_pending_ > 0);
378 95239 : if (do_assert)
379 93895 : assert(check);
380 95239 : return check;
381 : }
382 :
383 23005 : bool PeerCloseManager::AssertMembershipState(bool do_assert) {
384 23005 : bool check = (membership_state_ != MEMBERSHIP_IN_USE);
385 23005 : if (do_assert)
386 20339 : assert(check);
387 23005 : return check;
388 : }
389 :
390 21210 : bool PeerCloseManager::AssertMembershipReqCount(bool do_assert) {
391 21210 : bool check = !membership_req_pending_;
392 21210 : if (do_assert)
393 20279 : assert(check);
394 21210 : return check;
395 : }
396 :
397 1418 : void PeerCloseManager::TriggerSweepStateActions() {
398 1418 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
399 1418 : if (!AssertSweepState())
400 576 : return;
401 :
402 : // Notify clients to trigger sweep as appropriate.
403 842 : peer_close_->GracefulRestartSweep();
404 :
405 : // Reset MembershipUse state after client has been notified above.
406 842 : set_membership_state(MEMBERSHIP_NONE);
407 842 : CloseComplete();
408 : }
409 :
410 : // Notify clients about entering Stale event.
411 1028 : void PeerCloseManager::StaleNotify() {
412 1028 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
413 :
414 1028 : peer_close_->GracefulRestartStale();
415 1028 : if (!AssertMembershipState())
416 48 : return;
417 980 : MembershipRequest(NULL);
418 : }
419 :
420 19455 : bool PeerCloseManager::CanUseMembershipManager() const {
421 19455 : return peer_close_->peer()->CanUseMembershipManager();
422 : }
423 :
424 20279 : void PeerCloseManager::GetRegisteredRibs(std::list<BgpTable *> *tables) {
425 20279 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
426 20279 : mgr->GetRegisteredRibs(peer_close_->peer(), tables);
427 20279 : }
428 :
429 83472 : bool PeerCloseManager::IsRegistered(BgpTable *table) const {
430 83472 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
431 83472 : return mgr->IsRegistered(peer_close_->peer(), table);
432 : }
433 :
434 73472 : void PeerCloseManager::Unregister(BgpTable *table) {
435 73472 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
436 73472 : mgr->Unregister(peer_close_->peer(), table);
437 73472 : }
438 :
439 3807 : void PeerCloseManager::WalkRibIn(BgpTable *table) {
440 3807 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
441 3807 : mgr->WalkRibIn(peer_close_->peer(), table);
442 3807 : }
443 :
444 4385 : void PeerCloseManager::UnregisterRibOut(BgpTable *table) {
445 4385 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
446 4385 : mgr->UnregisterRibOut(peer_close_->peer(), table);
447 4385 : }
448 :
449 4009 : bool PeerCloseManager::IsRibInRegistered(BgpTable *table) const {
450 4009 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
451 4009 : return mgr->IsRibInRegistered(peer_close_->peer(), table);
452 : }
453 :
454 1808 : void PeerCloseManager::UnregisterRibIn(BgpTable *table) {
455 1808 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
456 1808 : mgr->UnregisterRibIn(peer_close_->peer(), table);
457 1808 : }
458 :
459 21977 : void PeerCloseManager::MembershipRequest() {
460 21977 : if (!AssertMembershipState())
461 848 : return;
462 :
463 : // Pause if membership manager is not ready for usage.
464 21129 : if (!CanUseMembershipManager()) {
465 899 : set_membership_state(MEMBERSHIP_IN_WAIT);
466 935 : PEER_CLOSE_MANAGER_LOG("Wait for membership manager availability");
467 899 : return;
468 : }
469 20230 : set_membership_state(MEMBERSHIP_IN_USE);
470 20230 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST));
471 : }
472 :
473 21210 : void PeerCloseManager::MembershipRequest(Event *evnet) {
474 21210 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
475 :
476 21210 : set_membership_state(MEMBERSHIP_IN_USE);
477 21210 : if (!AssertMembershipReqCount())
478 10871 : return;
479 20762 : membership_req_pending_++;
480 20762 : std::list<BgpTable *> tables;
481 20762 : GetRegisteredRibs(&tables);
482 :
483 20762 : if (tables.empty()) {
484 10423 : assert(MembershipRequestCallback(NULL));
485 10423 : return;
486 : }
487 :
488 : // Account for extra increment above.
489 10339 : membership_req_pending_--;
490 178249 : BOOST_FOREACH(BgpTable *table, tables) {
491 83955 : membership_req_pending_++;
492 83955 : if (IsRegistered(table)) {
493 79706 : if (state_ == PeerCloseManager::DELETE) {
494 100198 : PEER_CLOSE_MANAGER_TABLE_LOG(
495 : "MembershipManager::Unregister");
496 73589 : Unregister(table);
497 6117 : } else if (state_ == PeerCloseManager::SWEEP) {
498 3691 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
499 1669 : WalkRibIn(table);
500 : } else {
501 11711 : PEER_CLOSE_MANAGER_TABLE_LOG(
502 : "MembershipManager::UnregisterRibOut");
503 4448 : UnregisterRibOut(table);
504 : }
505 : } else {
506 4249 : assert(IsRibInRegistered(table));
507 4249 : if (state_ == PeerCloseManager::DELETE) {
508 5035 : PEER_CLOSE_MANAGER_TABLE_LOG(
509 : "MembershipManager::UnregisterRibIn");
510 1926 : UnregisterRibIn(table);
511 : } else {
512 6105 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
513 2323 : WalkRibIn(table);
514 : }
515 : }
516 : }
517 20762 : }
518 :
519 84599 : void PeerCloseManager::MembershipRequestCallback() {
520 84599 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST_COMPLETE_CALLBACK));
521 84810 : }
522 :
523 : // Close process for this peer in terms of walking RibIns and RibOuts are
524 : // complete. Do the final cleanups necessary and notify interested party
525 : //
526 : // Retrun true if we are done using membership manager, false otherwise.
527 95239 : bool PeerCloseManager::MembershipRequestCallback(Event *event) {
528 95239 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
529 :
530 95239 : bool result = false;
531 113835 : PEER_CLOSE_MANAGER_LOG("MembershipRequestCallback");
532 :
533 95239 : if (!AssertMembershipManagerInUse())
534 0 : return result;
535 95239 : if (--membership_req_pending_)
536 73616 : return result;
537 :
538 : // Indicate to the caller that we are done using the membership manager.
539 21623 : result = true;
540 :
541 21623 : if (state_ == DELETE) {
542 19576 : MOVE_TO_STATE(NONE);
543 18748 : peer_close_->Delete();
544 18748 : gr_elapsed_ = 0;
545 18748 : llgr_elapsed_ = 0;
546 18748 : stats_.init++;
547 18748 : close_again_ = false;
548 18748 : graceful_ = true;
549 18748 : set_membership_state(MEMBERSHIP_NONE);
550 18748 : return result;
551 : }
552 :
553 : // Process nested closures.
554 2875 : if (close_again_) {
555 0 : set_membership_state(MEMBERSHIP_NONE);
556 0 : CloseComplete();
557 :
558 : // Nested closure can make membership manager to be in use again.
559 0 : return membership_state_ != MEMBERSHIP_IN_USE;
560 : }
561 :
562 : // If any GR stale timer has to be launched, then to wait for some time
563 : // hoping for the peer (and the paths) to come back up.
564 2875 : if (state_ == STALE) {
565 1076 : peer_close_->CloseComplete();
566 1271 : MOVE_TO_STATE(GR_TIMER);
567 1076 : peer_close_->GetGracefulRestartFamilies(&families_);
568 :
569 : // Offset restart time with elapsed time during nested closures.
570 1076 : int time = peer_close_->GetGracefulRestartTime() * 1000;
571 1076 : time -= gr_elapsed_;
572 1076 : if (time < 0)
573 0 : time = 0;
574 1076 : StartRestartTimer(time);
575 1076 : stats_.gr_timer++;
576 1076 : set_membership_state(MEMBERSHIP_NONE);
577 1076 : return result;
578 : }
579 :
580 : // From LLGR_STALE state, switch to LLGR_TIMER state. Typically this would
581 : // be a very long timer, and we expect to receive EORs before this timer
582 : // expires.
583 : // Just like for GRSTALE in the above case, before moving to LLGR_TIMER and
584 : // starting LLGR_TIMER, we can check if the peer can come back up.
585 1799 : if (state_ == LLGR_STALE) {
586 410 : MOVE_TO_STATE(LLGR_TIMER);
587 381 : peer_close_->CloseComplete();
588 381 : peer_close_->GetLongLivedGracefulRestartFamilies(&families_);
589 :
590 : // Offset restart time with elapsed time during nested closures.
591 381 : int time = peer_close_->GetLongLivedGracefulRestartTime() * 1000;
592 381 : time -= llgr_elapsed_;
593 381 : if (time < 0)
594 0 : time = 0;
595 381 : StartRestartTimer(time);
596 381 : stats_.llgr_timer++;
597 381 : set_membership_state(MEMBERSHIP_NONE);
598 381 : return result;
599 : }
600 :
601 1418 : TriggerSweepStateActions();
602 1418 : return result;
603 : }
604 :
605 62777 : void PeerCloseManager::FillRouteCloseInfo(PeerCloseInfo *close_info) const {
606 62777 : std::map<std::string, PeerCloseRouteInfo> route_stats;
607 :
608 690547 : for (int i = 0; i < Address::NUM_FAMILIES; i++) {
609 627770 : if (!stats_.route_stats[i].IsSet())
610 472957 : continue;
611 154813 : PeerCloseRouteInfo route_info;
612 154813 : route_info.set_staled(stats_.route_stats[i].staled);
613 154813 : route_info.set_llgr_staled(stats_.route_stats[i].llgr_staled);
614 154813 : route_info.set_refreshed(stats_.route_stats[i].refreshed);
615 154813 : route_info.set_fresh(stats_.route_stats[i].fresh);
616 154813 : route_info.set_deleted(stats_.route_stats[i].deleted);
617 154813 : route_stats[Address::FamilyToString(static_cast<Address::Family>(i))] = route_info;
618 154813 : }
619 :
620 62777 : if (!route_stats.empty())
621 61964 : close_info->set_route_stats(route_stats);
622 62777 : }
623 :
624 62777 : BgpNeighborResp *PeerCloseManager::FillCloseInfo(BgpNeighborResp *resp) const {
625 62777 : PeerCloseInfo peer_close_info;
626 62777 : peer_close_info.set_state(GetStateName(state_));
627 62777 : peer_close_info.set_membership_state(
628 125554 : GetMembershipStateName(membership_state_));
629 62777 : peer_close_info.set_close_again(close_again_);
630 62777 : peer_close_info.set_graceful(graceful_);
631 62777 : peer_close_info.set_init(stats_.init);
632 62777 : peer_close_info.set_close(stats_.close);
633 62777 : peer_close_info.set_nested(stats_.nested);
634 62777 : peer_close_info.set_deletes(stats_.deletes);
635 62777 : peer_close_info.set_stale(stats_.stale);
636 62777 : peer_close_info.set_llgr_stale(stats_.llgr_stale);
637 62777 : peer_close_info.set_sweep(stats_.sweep);
638 62777 : peer_close_info.set_gr_timer(stats_.gr_timer);
639 62777 : peer_close_info.set_llgr_timer(stats_.llgr_timer);
640 62777 : FillRouteCloseInfo(&peer_close_info);
641 :
642 62777 : resp->set_peer_close_info(peer_close_info);
643 :
644 62777 : return resp;
645 62777 : }
646 :
647 216846 : void PeerCloseManager::UpdateRouteStats(Address::Family family,
648 : const BgpPath *old_path, uint32_t path_flags) const {
649 216846 : if (state_ == NONE)
650 196932 : return;
651 :
652 19914 : if (!old_path)
653 58 : stats_.route_stats[family].fresh++;
654 19856 : else if (old_path->IsStale() && !(path_flags & BgpPath::Stale))
655 3378 : stats_.route_stats[family].refreshed++;
656 : }
657 :
658 100941 : bool PeerCloseManager::MembershipPathCallback(DBTablePartBase *root,
659 : BgpRoute *rt, BgpPath *path) {
660 100941 : CHECK_CONCURRENCY("db::DBTable");
661 100961 : DBRequest::DBOperation oper = DBRequest::DB_ENTRY_INVALID;
662 100961 : BgpAttrPtr attrs;
663 :
664 100961 : BgpTable *table = static_cast<BgpTable *>(root->parent());
665 100959 : assert(table);
666 :
667 100959 : uint32_t stale = 0;
668 :
669 100959 : switch (state_) {
670 0 : case NONE:
671 : case GR_TIMER:
672 : case LLGR_TIMER:
673 0 : return false;
674 :
675 6036 : case SWEEP:
676 :
677 : // Stale paths must be deleted.
678 6036 : if (!path->IsStale() && !path->IsLlgrStale())
679 2880 : return false;
680 3157 : if (path->IsStale()) {
681 3156 : path->ResetStale();
682 3156 : table->UpdateStalePathCount(-1);
683 : }
684 3158 : if (path->IsLlgrStale()) {
685 0 : path->ResetLlgrStale();
686 0 : table->UpdateLlgrStalePathCount(-1);
687 : }
688 3158 : oper = DBRequest::DB_ENTRY_DELETE;
689 3158 : attrs = NULL;
690 3157 : stats_.route_stats[table->family()].deleted++;
691 3158 : break;
692 :
693 76946 : case DELETE:
694 :
695 : // This path must be deleted. Hence attr is not required.
696 76946 : oper = DBRequest::DB_ENTRY_DELETE;
697 76946 : attrs = NULL;
698 76943 : stats_.route_stats[table->family()].deleted++;
699 76976 : break;
700 :
701 14747 : case STALE:
702 :
703 : // We do not support GR for multicast routes (yet).
704 29496 : if ((table->family() == Address::ERMVPN) ||
705 14749 : (table->family() == Address::MVPN)) {
706 0 : oper = DBRequest::DB_ENTRY_DELETE;
707 0 : attrs = NULL;
708 0 : stats_.route_stats[table->family()].deleted++;
709 0 : break;
710 : }
711 :
712 : // If path is already marked as stale, then there is no need to
713 : // process again. This can happen if the session flips while in
714 : // GR_TIMER state.
715 14748 : if (path->IsStale())
716 3285 : return false;
717 :
718 : // This path must be marked for staling. Update the local
719 : // preference and update the route accordingly.
720 11465 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
721 11465 : attrs = path->GetAttr();
722 11470 : stale = BgpPath::Stale;
723 11470 : stats_.route_stats[table->family()].staled++;
724 11469 : break;
725 :
726 3233 : case LLGR_STALE:
727 :
728 : // If the path has NO_LLGR community, DELETE it.
729 3233 : if (path->GetAttr()->community() &&
730 0 : path->GetAttr()->community()->ContainsValue(
731 : CommunityType::NoLlgr)) {
732 0 : oper = DBRequest::DB_ENTRY_DELETE;
733 0 : attrs = NULL;
734 0 : stats_.route_stats[table->family()].deleted++;
735 0 : break;
736 : }
737 :
738 : // If path is already marked as llgr_stale, then there is no
739 : // need to process again. This can happen if the session flips
740 : // while in LLGR_TIMER state.
741 3232 : if (path->IsLlgrStale())
742 0 : return false;
743 :
744 3232 : attrs = path->GetAttr();
745 3236 : stale = BgpPath::LlgrStale;
746 3236 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
747 3236 : stats_.route_stats[table->family()].llgr_staled++;
748 3235 : break;
749 : }
750 :
751 : // Feed the route modify/delete request to the table input process.
752 284499 : return table->InputCommon(root, rt, path, peer_close_->peer(), NULL, oper,
753 94832 : attrs, path->GetPathId(), path->GetFlags() | stale, path->GetLabel(),
754 94832 : path->GetL3Label());
755 100995 : }
756 :
757 : //
758 : // Handler for an Event.
759 : //
760 143650 : bool PeerCloseManager::EventCallback(Event *event) {
761 143650 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
762 : bool result;
763 :
764 143650 : switch (event->event_type) {
765 0 : case EVENT_NONE:
766 0 : break;
767 20946 : case CLOSE:
768 20946 : Close(event);
769 20946 : break;
770 14824 : case EOR_RECEIVED:
771 14824 : ProcessEORMarkerReceived(event);
772 14824 : break;
773 20230 : case MEMBERSHIP_REQUEST:
774 20230 : MembershipRequest(event);
775 20230 : break;
776 84816 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
777 84816 : result = MembershipRequestCallback(event);
778 :
779 : // Notify clients if we are no longer using the membership mgr.
780 84816 : if (result)
781 11200 : peer_close_->MembershipRequestCallbackComplete();
782 84816 : break;
783 2834 : case TIMER_CALLBACK:
784 2834 : RestartTimerCallback(event);
785 2834 : break;
786 : }
787 :
788 143650 : delete event;
789 143650 : return true;
790 : }
|