Line data Source code
1 : /*
2 : * Copyright (c) 2013 Juniper Networks, Inc. All rights reserved.
3 : */
4 :
5 : #include "bgp/peer_close_manager.h"
6 :
7 :
8 : #include <list>
9 : #include <map>
10 :
11 : #include <boost/foreach.hpp>
12 :
13 : #include "base/task_annotations.h"
14 : #include "bgp/bgp_log.h"
15 : #include "bgp/bgp_membership.h"
16 : #include "bgp/bgp_peer_types.h"
17 : #include "bgp/bgp_route.h"
18 : #include "bgp/bgp_server.h"
19 : #include "bgp/routing-instance/routing_instance.h"
20 : #include "net/community_type.h"
21 :
22 : #define PEER_CLOSE_MANAGER_LOG(msg) \
23 : BGP_LOG_PEER(Event, peer_close_->peer(), SandeshLevel::SYS_INFO, \
24 : BGP_LOG_FLAG_ALL, BGP_PEER_DIR_NA, \
25 : "PeerCloseManager: State " << GetStateName(state_) << \
26 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
27 : ", MembershipReqPending: " << membership_req_pending_ << \
28 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
29 :
30 : #define PEER_CLOSE_MANAGER_TABLE_LOG(msg) \
31 : BGP_LOG_PEER_TABLE(peer_close_->peer(), SandeshLevel::SYS_INFO, \
32 : BGP_LOG_FLAG_ALL, table, \
33 : "PeerCloseManager: State " << GetStateName(state_) << \
34 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
35 : ", MembershipReqPending: " << membership_req_pending_ << \
36 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
37 :
38 : #define MOVE_TO_STATE(state) \
39 : do { \
40 : assert(state_ != state); \
41 : PEER_CLOSE_MANAGER_LOG("Move to state " << GetStateName(state)); \
42 : state_ = state; \
43 : } while (false)
44 :
45 : // Create an instance of PeerCloseManager with back reference to parent IPeer
46 8064 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close,
47 8064 : boost::asio::io_context *io_service) :
48 8064 : peer_close_(peer_close), gr_timer_(NULL),
49 16128 : event_queue_(new WorkQueue<Event *>(
50 24192 : TaskScheduler::GetInstance()->GetTaskId(
51 8064 : peer_close_->GetTaskName()),
52 8064 : peer_close_->GetTaskInstance(),
53 8064 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
54 8064 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
55 16128 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
56 8064 : stats_.init++;
57 8064 : membership_req_pending_ = 0;
58 8064 : gr_timer_ = TimerManager::CreateTimer(*io_service,
59 : "Graceful Restart Timer");
60 8064 : }
61 :
62 : // Create an instance of PeerCloseManager with back reference to parent IPeer
63 20402 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close) :
64 20402 : peer_close_(peer_close), gr_timer_(NULL),
65 40804 : event_queue_(new WorkQueue<Event *>(
66 61206 : TaskScheduler::GetInstance()->GetTaskId(
67 20402 : peer_close_->GetTaskName()),
68 20402 : peer_close_->GetTaskInstance(),
69 20402 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
70 20402 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
71 40804 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
72 20402 : stats_.init++;
73 20402 : membership_req_pending_ = 0;
74 20402 : if (peer_close->peer() && peer_close->peer()->server()) {
75 16587 : gr_timer_ =
76 16587 : TimerManager::CreateTimer(*peer_close->peer()->server()->ioservice(),
77 : "Graceful Restart Timer");
78 : }
79 20402 : }
80 :
81 45853 : PeerCloseManager::~PeerCloseManager() {
82 28466 : event_queue_->Shutdown();
83 28466 : TimerManager::DeleteTimer(gr_timer_);
84 45853 : }
85 :
86 225600 : std::string PeerCloseManager::GetStateName(State state) const {
87 225600 : switch (state) {
88 32533 : case NONE:
89 32533 : return "NONE";
90 68486 : case GR_TIMER:
91 68486 : return "GR_TIMER";
92 19512 : case STALE:
93 19512 : return "STALE";
94 5879 : case LLGR_STALE:
95 5879 : return "LLGR_STALE";
96 6254 : case LLGR_TIMER:
97 6254 : return "LLGR_TIMER";
98 10726 : case SWEEP:
99 10726 : return "SWEEP";
100 82212 : case DELETE:
101 82212 : return "DELETE";
102 : }
103 0 : assert(false);
104 : return "";
105 : }
106 :
107 203518 : std::string PeerCloseManager::GetMembershipStateName(
108 : MembershipState state) const {
109 203518 : switch (state) {
110 91047 : case MEMBERSHIP_NONE:
111 91047 : return "NONE";
112 108108 : case MEMBERSHIP_IN_USE:
113 108108 : return "IN_USE";
114 4363 : case MEMBERSHIP_IN_WAIT:
115 4363 : return "IN_WAIT";
116 : }
117 0 : assert(false);
118 : return "";
119 : }
120 :
121 53892 : std::string PeerCloseManager::GetEventName(EventType eventType) const {
122 53892 : switch (eventType) {
123 0 : case EVENT_NONE:
124 0 : return "NONE";
125 10169 : case CLOSE:
126 10169 : return "CLOSE";
127 5523 : case EOR_RECEIVED:
128 5523 : return "EOR_RECEIVED";
129 9694 : case MEMBERSHIP_REQUEST:
130 9694 : return "MEMBERSHIP_REQUEST";
131 25678 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
132 25678 : return "MEMBERSHIP_REQUEST_COMPLETE_CALLBACK";
133 2829 : case TIMER_CALLBACK:
134 2829 : return "TIMER_CALLBACK";
135 : }
136 :
137 0 : return "";
138 : }
139 :
140 143193 : void PeerCloseManager::EnqueueEvent(Event *event) {
141 163723 : PEER_CLOSE_MANAGER_LOG("Enqueued event " <<
142 : GetEventName(event->event_type) <<
143 : ", graceful " << event->graceful <<
144 : ", family " << Address::FamilyToString(event->family));
145 143245 : event_queue_->Enqueue(event);
146 143441 : }
147 :
148 : // Trigger closure of an IPeer
149 : //
150 : // Graceful close_state_: NONE
151 : // RibIn Stale Marking and Ribout deletion close_state_: STALE
152 : // StateMachine restart and GR timer start close_state_: GR_TIMER
153 : //
154 : // Peer IsReady() in GR timer callback (or via reception of all EoRs)
155 : // RibIn Sweep and Ribout Generation close_state_: SWEEP
156 : // MembershipRequestCallback close_state_: NONE
157 : //
158 : // Peer not IsReady() in GR timer callback
159 : // If LLGR supported close_state_: LLGR_STALE
160 : // RibIn Stale marking with LLGR_STALE community close_state_: LLGR_TIMER
161 : //
162 : // Peer not IsReady() in LLGR timer callback
163 : // RibIn Delete close_state_: DELETE
164 : // MembershipRequestCallback close_state_: NONE
165 : //
166 : // Peer IsReady() in LLGR timer callback (or via reception of all EoRs)
167 : // RibIn Sweep close_state_: SWEEP
168 : // MembershipRequestCallback close_state_: NONE
169 : //
170 : // If LLGR is not supported
171 : // RibIn Delete close_state_: DELETE
172 : // MembershipRequestCallback close_state_: NONE
173 : //
174 : // Close() call during any state other than NONE and DELETE
175 : // Cancel GR timer and restart GR Closure all over again
176 : //
177 : // NonGraceful close_state_ = * (except DELETE)
178 : // A. RibIn deletion and Ribout deletion close_state_ = DELETE
179 : // B. MembershipRequestCallback => Peers delete/StateMachine restart
180 : // close_state_ = NONE
181 : //
182 : // If Close is restarted, account for GR timer's elapsed time.
183 : //
184 : // Use graceful as true to close gracefully.
185 20921 : void PeerCloseManager::Close(bool graceful) {
186 20921 : EnqueueEvent(new Event(CLOSE, graceful));
187 20926 : }
188 :
189 20926 : void PeerCloseManager::Close(Event *event) {
190 : // Note down non-graceful close trigger. Once non-graceful closure is
191 : // triggered, it should remain so until close process is complete. Further
192 : // graceful closure calls until then should remain non-graceful.
193 20926 : graceful_ &= event->graceful;
194 20926 : CloseInternal();
195 20926 : }
196 :
197 21461 : void PeerCloseManager::CloseInternal() {
198 21461 : stats_.close++;
199 :
200 : // Ignore nested closures
201 21461 : if (close_again_) {
202 4 : PEER_CLOSE_MANAGER_LOG("Nested close calls ignored");
203 4 : return;
204 : }
205 :
206 21457 : switch (state_) {
207 19897 : case NONE:
208 19897 : stats_.ResetRouteStats();
209 19897 : ProcessClosure();
210 19897 : break;
211 :
212 339 : case GR_TIMER:
213 465 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart GR");
214 339 : close_again_ = true;
215 339 : stats_.nested++;
216 339 : gr_elapsed_ += gr_timer_->GetElapsedTime();
217 339 : CloseComplete();
218 339 : break;
219 :
220 196 : case LLGR_TIMER:
221 196 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart LLGR");
222 196 : close_again_ = true;
223 196 : stats_.nested++;
224 196 : llgr_elapsed_ += gr_timer_->GetElapsedTime();
225 196 : CloseComplete();
226 196 : break;
227 :
228 1025 : case STALE:
229 : case LLGR_STALE:
230 : case SWEEP:
231 : case DELETE:
232 1025 : PEER_CLOSE_MANAGER_LOG("Nested close");
233 1025 : close_again_ = true;
234 1025 : stats_.nested++;
235 1025 : break;
236 : }
237 : }
238 :
239 14772 : void PeerCloseManager::ProcessEORMarkerReceived(Address::Family family) {
240 14772 : EnqueueEvent(new Event(EOR_RECEIVED, family));
241 14773 : }
242 :
243 14773 : void PeerCloseManager::ProcessEORMarkerReceived(Event *event) {
244 14773 : if ((state_ == GR_TIMER || state_ == LLGR_TIMER) && !families_.empty()) {
245 1832 : if (event->family == Address::UNSPEC) {
246 40 : families_.clear();
247 : } else {
248 1792 : families_.erase(event->family);
249 : }
250 :
251 : // Start the timer if all EORs have been received.
252 1832 : if (families_.empty())
253 1224 : StartRestartTimer(0);
254 : }
255 14773 : }
256 :
257 : // Process RibIn during peer closure.
258 2680 : void PeerCloseManager::StartRestartTimer(int time) {
259 2680 : gr_timer_->Cancel();
260 2944 : PEER_CLOSE_MANAGER_LOG("GR Timer started to fire after " << time/1000 <<
261 : " seconds");
262 2680 : gr_timer_->Start(time,
263 : boost::bind(&PeerCloseManager::RestartTimerCallback, this));
264 2680 : }
265 :
266 2832 : bool PeerCloseManager::RestartTimerCallback() {
267 2832 : CHECK_CONCURRENCY("timer::TimerTask");
268 2831 : EnqueueEvent(new Event(TIMER_CALLBACK));
269 2833 : return false;
270 : }
271 :
272 2833 : void PeerCloseManager::RestartTimerCallback(Event *event) {
273 2833 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
274 :
275 2943 : PEER_CLOSE_MANAGER_LOG("GR Timer callback started");
276 2833 : if (state_ != GR_TIMER && state_ != LLGR_TIMER)
277 960 : return;
278 :
279 1873 : if (peer_close_->IsReady() && !families_.empty()) {
280 : // Fake reception of all EORs.
281 204 : for (IPeerClose::Families::iterator i = families_.begin(), next = i;
282 408 : i != families_.end(); i = next) {
283 204 : next++;
284 216 : PEER_CLOSE_MANAGER_LOG("Simulate EoR reception for family " << *i);
285 204 : peer_close_->ReceiveEndOfRIB(*i);
286 : }
287 : } else {
288 1669 : ProcessClosure();
289 : }
290 : }
291 :
292 : // Route stale timer callback. If the peer has come back up, sweep routes for
293 : // those address families that are still active. Delete the rest
294 21566 : void PeerCloseManager::ProcessClosure() {
295 : // If the peer is back up and this address family is still supported,
296 : // sweep old paths which may not have come back in the new session
297 21566 : switch (state_) {
298 19897 : case NONE:
299 19897 : if (!graceful_ || !peer_close_->IsCloseGraceful()) {
300 19669 : MOVE_TO_STATE(DELETE);
301 18870 : stats_.deletes++;
302 : } else {
303 1222 : MOVE_TO_STATE(STALE);
304 1027 : stats_.stale++;
305 1027 : StaleNotify();
306 1027 : return;
307 : }
308 18870 : break;
309 1104 : case GR_TIMER:
310 1104 : if (peer_close_->IsReady()) {
311 746 : MOVE_TO_STATE(SWEEP);
312 706 : gr_elapsed_ = 0;
313 706 : llgr_elapsed_ = 0;
314 706 : stats_.sweep++;
315 706 : break;
316 : }
317 398 : if (peer_close_->IsCloseLongLivedGraceful()) {
318 308 : MOVE_TO_STATE(LLGR_STALE);
319 279 : stats_.llgr_stale++;
320 279 : peer_close_->LongLivedGracefulRestartStale();
321 279 : break;
322 : }
323 119 : MOVE_TO_STATE(DELETE);
324 119 : stats_.deletes++;
325 119 : break;
326 :
327 565 : case LLGR_TIMER:
328 565 : if (peer_close_->IsReady()) {
329 318 : MOVE_TO_STATE(SWEEP);
330 318 : gr_elapsed_ = 0;
331 318 : llgr_elapsed_ = 0;
332 318 : stats_.sweep++;
333 318 : break;
334 : }
335 276 : MOVE_TO_STATE(DELETE);
336 247 : stats_.deletes++;
337 247 : break;
338 :
339 0 : case STALE:
340 : case LLGR_STALE:
341 : case SWEEP:
342 : case DELETE:
343 0 : assert(false);
344 : return;
345 : }
346 :
347 20539 : if (state_ == DELETE)
348 19236 : peer_close_->CustomClose();
349 20539 : MembershipRequest();
350 : }
351 :
352 1374 : void PeerCloseManager::CloseComplete() {
353 1540 : MOVE_TO_STATE(NONE);
354 1374 : gr_timer_->Cancel();
355 1374 : families_.clear();
356 1374 : stats_.init++;
357 :
358 : // Nested closures trigger fresh GR
359 1374 : if (close_again_) {
360 535 : close_again_ = false;
361 535 : CloseInternal();
362 : }
363 1374 : }
364 :
365 1415 : bool PeerCloseManager::AssertSweepState(bool do_assert) {
366 1415 : bool check = (state_ == SWEEP);
367 1415 : if (do_assert)
368 647 : assert(check);
369 1415 : return check;
370 : }
371 :
372 95126 : bool PeerCloseManager::AssertMembershipManagerInUse(bool do_assert) {
373 95126 : bool check = false;
374 181500 : check |= (state_ == STALE || state_ == LLGR_STALE || state_ == SWEEP ||
375 86374 : state_ == DELETE);
376 95126 : check |= (membership_state_ == MEMBERSHIP_IN_USE);
377 95126 : check |= (membership_req_pending_ > 0);
378 95126 : if (do_assert)
379 93782 : assert(check);
380 95126 : return check;
381 : }
382 :
383 22969 : bool PeerCloseManager::AssertMembershipState(bool do_assert) {
384 22969 : bool check = (membership_state_ != MEMBERSHIP_IN_USE);
385 22969 : if (do_assert)
386 20301 : assert(check);
387 22969 : return check;
388 : }
389 :
390 21178 : bool PeerCloseManager::AssertMembershipReqCount(bool do_assert) {
391 21178 : bool check = !membership_req_pending_;
392 21178 : if (do_assert)
393 20242 : assert(check);
394 21178 : return check;
395 : }
396 :
397 1415 : void PeerCloseManager::TriggerSweepStateActions() {
398 1415 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
399 1415 : if (!AssertSweepState())
400 576 : return;
401 :
402 : // Notify clients to trigger sweep as appropriate.
403 839 : peer_close_->GracefulRestartSweep();
404 :
405 : // Reset MembershipUse state after client has been notified above.
406 839 : set_membership_state(MEMBERSHIP_NONE);
407 839 : CloseComplete();
408 : }
409 :
410 : // Notify clients about entering Stale event.
411 1027 : void PeerCloseManager::StaleNotify() {
412 1027 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
413 :
414 1027 : peer_close_->GracefulRestartStale();
415 1027 : if (!AssertMembershipState())
416 48 : return;
417 979 : MembershipRequest(NULL);
418 : }
419 :
420 19418 : bool PeerCloseManager::CanUseMembershipManager() const {
421 19418 : return peer_close_->peer()->CanUseMembershipManager();
422 : }
423 :
424 20242 : void PeerCloseManager::GetRegisteredRibs(std::list<BgpTable *> *tables) {
425 20242 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
426 20242 : mgr->GetRegisteredRibs(peer_close_->peer(), tables);
427 20242 : }
428 :
429 83377 : bool PeerCloseManager::IsRegistered(BgpTable *table) const {
430 83377 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
431 83377 : return mgr->IsRegistered(peer_close_->peer(), table);
432 : }
433 :
434 73398 : void PeerCloseManager::Unregister(BgpTable *table) {
435 73398 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
436 73398 : mgr->Unregister(peer_close_->peer(), table);
437 73398 : }
438 :
439 3804 : void PeerCloseManager::WalkRibIn(BgpTable *table) {
440 3804 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
441 3804 : mgr->WalkRibIn(peer_close_->peer(), table);
442 3804 : }
443 :
444 4372 : void PeerCloseManager::UnregisterRibOut(BgpTable *table) {
445 4372 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
446 4372 : mgr->UnregisterRibOut(peer_close_->peer(), table);
447 4372 : }
448 :
449 4012 : bool PeerCloseManager::IsRibInRegistered(BgpTable *table) const {
450 4012 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
451 4012 : return mgr->IsRibInRegistered(peer_close_->peer(), table);
452 : }
453 :
454 1803 : void PeerCloseManager::UnregisterRibIn(BgpTable *table) {
455 1803 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
456 1803 : mgr->UnregisterRibIn(peer_close_->peer(), table);
457 1803 : }
458 :
459 21942 : void PeerCloseManager::MembershipRequest() {
460 21942 : if (!AssertMembershipState())
461 848 : return;
462 :
463 : // Pause if membership manager is not ready for usage.
464 21094 : if (!CanUseMembershipManager()) {
465 895 : set_membership_state(MEMBERSHIP_IN_WAIT);
466 938 : PEER_CLOSE_MANAGER_LOG("Wait for membership manager availability");
467 895 : return;
468 : }
469 20199 : set_membership_state(MEMBERSHIP_IN_USE);
470 20199 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST));
471 : }
472 :
473 21178 : void PeerCloseManager::MembershipRequest(Event *evnet) {
474 21178 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
475 :
476 21178 : set_membership_state(MEMBERSHIP_IN_USE);
477 21178 : if (!AssertMembershipReqCount())
478 10853 : return;
479 20730 : membership_req_pending_++;
480 20730 : std::list<BgpTable *> tables;
481 20730 : GetRegisteredRibs(&tables);
482 :
483 20730 : if (tables.empty()) {
484 10405 : assert(MembershipRequestCallback(NULL));
485 10405 : return;
486 : }
487 :
488 : // Account for extra increment above.
489 10325 : membership_req_pending_--;
490 178055 : BOOST_FOREACH(BgpTable *table, tables) {
491 83865 : membership_req_pending_++;
492 83865 : if (IsRegistered(table)) {
493 79608 : if (state_ == PeerCloseManager::DELETE) {
494 100108 : PEER_CLOSE_MANAGER_TABLE_LOG(
495 : "MembershipManager::Unregister");
496 73517 : Unregister(table);
497 6091 : } else if (state_ == PeerCloseManager::SWEEP) {
498 3668 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
499 1657 : WalkRibIn(table);
500 : } else {
501 11684 : PEER_CLOSE_MANAGER_TABLE_LOG(
502 : "MembershipManager::UnregisterRibOut");
503 4434 : UnregisterRibOut(table);
504 : }
505 : } else {
506 4257 : assert(IsRibInRegistered(table));
507 4257 : if (state_ == PeerCloseManager::DELETE) {
508 5031 : PEER_CLOSE_MANAGER_TABLE_LOG(
509 : "MembershipManager::UnregisterRibIn");
510 1922 : UnregisterRibIn(table);
511 : } else {
512 6125 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
513 2335 : WalkRibIn(table);
514 : }
515 : }
516 : }
517 20730 : }
518 :
519 84468 : void PeerCloseManager::MembershipRequestCallback() {
520 84468 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST_COMPLETE_CALLBACK));
521 84706 : }
522 :
523 : // Close process for this peer in terms of walking RibIns and RibOuts are
524 : // complete. Do the final cleanups necessary and notify interested party
525 : //
526 : // Retrun true if we are done using membership manager, false otherwise.
527 95126 : bool PeerCloseManager::MembershipRequestCallback(Event *event) {
528 95126 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
529 :
530 95126 : bool result = false;
531 113727 : PEER_CLOSE_MANAGER_LOG("MembershipRequestCallback");
532 :
533 95126 : if (!AssertMembershipManagerInUse())
534 0 : return result;
535 95126 : if (--membership_req_pending_)
536 73540 : return result;
537 :
538 : // Indicate to the caller that we are done using the membership manager.
539 21586 : result = true;
540 :
541 21586 : if (state_ == DELETE) {
542 19543 : MOVE_TO_STATE(NONE);
543 18715 : peer_close_->Delete();
544 18715 : gr_elapsed_ = 0;
545 18715 : llgr_elapsed_ = 0;
546 18715 : stats_.init++;
547 18715 : close_again_ = false;
548 18715 : graceful_ = true;
549 18715 : set_membership_state(MEMBERSHIP_NONE);
550 18715 : return result;
551 : }
552 :
553 : // Process nested closures.
554 2871 : if (close_again_) {
555 0 : set_membership_state(MEMBERSHIP_NONE);
556 0 : CloseComplete();
557 :
558 : // Nested closure can make membership manager to be in use again.
559 0 : return membership_state_ != MEMBERSHIP_IN_USE;
560 : }
561 :
562 : // If any GR stale timer has to be launched, then to wait for some time
563 : // hoping for the peer (and the paths) to come back up.
564 2871 : if (state_ == STALE) {
565 1075 : peer_close_->CloseComplete();
566 1270 : MOVE_TO_STATE(GR_TIMER);
567 1075 : peer_close_->GetGracefulRestartFamilies(&families_);
568 :
569 : // Offset restart time with elapsed time during nested closures.
570 1075 : int time = peer_close_->GetGracefulRestartTime() * 1000;
571 1075 : time -= gr_elapsed_;
572 1075 : if (time < 0)
573 0 : time = 0;
574 1075 : StartRestartTimer(time);
575 1075 : stats_.gr_timer++;
576 1075 : set_membership_state(MEMBERSHIP_NONE);
577 1075 : return result;
578 : }
579 :
580 : // From LLGR_STALE state, switch to LLGR_TIMER state. Typically this would
581 : // be a very long timer, and we expect to receive EORs before this timer
582 : // expires.
583 : // Just like for GRSTALE in the above case, before moving to LLGR_TIMER and
584 : // starting LLGR_TIMER, we can check if the peer can come back up.
585 1796 : if (state_ == LLGR_STALE) {
586 410 : MOVE_TO_STATE(LLGR_TIMER);
587 381 : peer_close_->CloseComplete();
588 381 : peer_close_->GetLongLivedGracefulRestartFamilies(&families_);
589 :
590 : // Offset restart time with elapsed time during nested closures.
591 381 : int time = peer_close_->GetLongLivedGracefulRestartTime() * 1000;
592 381 : time -= llgr_elapsed_;
593 381 : if (time < 0)
594 0 : time = 0;
595 381 : StartRestartTimer(time);
596 381 : stats_.llgr_timer++;
597 381 : set_membership_state(MEMBERSHIP_NONE);
598 381 : return result;
599 : }
600 :
601 1415 : TriggerSweepStateActions();
602 1415 : return result;
603 : }
604 :
605 62599 : void PeerCloseManager::FillRouteCloseInfo(PeerCloseInfo *close_info) const {
606 62599 : std::map<std::string, PeerCloseRouteInfo> route_stats;
607 :
608 688589 : for (int i = 0; i < Address::NUM_FAMILIES; i++) {
609 625990 : if (!stats_.route_stats[i].IsSet())
610 471851 : continue;
611 154139 : PeerCloseRouteInfo route_info;
612 154139 : route_info.set_staled(stats_.route_stats[i].staled);
613 154139 : route_info.set_llgr_staled(stats_.route_stats[i].llgr_staled);
614 154139 : route_info.set_refreshed(stats_.route_stats[i].refreshed);
615 154139 : route_info.set_fresh(stats_.route_stats[i].fresh);
616 154139 : route_info.set_deleted(stats_.route_stats[i].deleted);
617 154139 : route_stats[Address::FamilyToString(static_cast<Address::Family>(i))] = route_info;
618 154139 : }
619 :
620 62599 : if (!route_stats.empty())
621 61741 : close_info->set_route_stats(route_stats);
622 62599 : }
623 :
624 62599 : BgpNeighborResp *PeerCloseManager::FillCloseInfo(BgpNeighborResp *resp) const {
625 62599 : PeerCloseInfo peer_close_info;
626 62599 : peer_close_info.set_state(GetStateName(state_));
627 62599 : peer_close_info.set_membership_state(
628 125198 : GetMembershipStateName(membership_state_));
629 62599 : peer_close_info.set_close_again(close_again_);
630 62599 : peer_close_info.set_graceful(graceful_);
631 62599 : peer_close_info.set_init(stats_.init);
632 62599 : peer_close_info.set_close(stats_.close);
633 62599 : peer_close_info.set_nested(stats_.nested);
634 62599 : peer_close_info.set_deletes(stats_.deletes);
635 62599 : peer_close_info.set_stale(stats_.stale);
636 62599 : peer_close_info.set_llgr_stale(stats_.llgr_stale);
637 62599 : peer_close_info.set_sweep(stats_.sweep);
638 62599 : peer_close_info.set_gr_timer(stats_.gr_timer);
639 62599 : peer_close_info.set_llgr_timer(stats_.llgr_timer);
640 62599 : FillRouteCloseInfo(&peer_close_info);
641 :
642 62599 : resp->set_peer_close_info(peer_close_info);
643 :
644 62599 : return resp;
645 62599 : }
646 :
647 216823 : void PeerCloseManager::UpdateRouteStats(Address::Family family,
648 : const BgpPath *old_path, uint32_t path_flags) const {
649 216823 : if (state_ == NONE)
650 197006 : return;
651 :
652 19817 : if (!old_path)
653 53 : stats_.route_stats[family].fresh++;
654 19764 : else if (old_path->IsStale() && !(path_flags & BgpPath::Stale))
655 3361 : stats_.route_stats[family].refreshed++;
656 : }
657 :
658 100673 : bool PeerCloseManager::MembershipPathCallback(DBTablePartBase *root,
659 : BgpRoute *rt, BgpPath *path) {
660 100673 : CHECK_CONCURRENCY("db::DBTable");
661 100671 : DBRequest::DBOperation oper = DBRequest::DB_ENTRY_INVALID;
662 100671 : BgpAttrPtr attrs;
663 :
664 100671 : BgpTable *table = static_cast<BgpTable *>(root->parent());
665 100671 : assert(table);
666 :
667 100671 : uint32_t stale = 0;
668 :
669 100671 : switch (state_) {
670 0 : case NONE:
671 : case GR_TIMER:
672 : case LLGR_TIMER:
673 0 : return false;
674 :
675 6009 : case SWEEP:
676 :
677 : // Stale paths must be deleted.
678 6009 : if (!path->IsStale() && !path->IsLlgrStale())
679 2870 : return false;
680 3139 : if (path->IsStale()) {
681 3139 : path->ResetStale();
682 3139 : table->UpdateStalePathCount(-1);
683 : }
684 3142 : if (path->IsLlgrStale()) {
685 0 : path->ResetLlgrStale();
686 0 : table->UpdateLlgrStalePathCount(-1);
687 : }
688 3142 : oper = DBRequest::DB_ENTRY_DELETE;
689 3142 : attrs = NULL;
690 3139 : stats_.route_stats[table->family()].deleted++;
691 3142 : break;
692 :
693 76678 : case DELETE:
694 :
695 : // This path must be deleted. Hence attr is not required.
696 76678 : oper = DBRequest::DB_ENTRY_DELETE;
697 76678 : attrs = NULL;
698 76682 : stats_.route_stats[table->family()].deleted++;
699 76717 : break;
700 :
701 14750 : case STALE:
702 :
703 : // We do not support GR for multicast routes (yet).
704 29500 : if ((table->family() == Address::ERMVPN) ||
705 14750 : (table->family() == Address::MVPN)) {
706 0 : oper = DBRequest::DB_ENTRY_DELETE;
707 0 : attrs = NULL;
708 0 : stats_.route_stats[table->family()].deleted++;
709 0 : break;
710 : }
711 :
712 : // If path is already marked as stale, then there is no need to
713 : // process again. This can happen if the session flips while in
714 : // GR_TIMER state.
715 14750 : if (path->IsStale())
716 3319 : return false;
717 :
718 : // This path must be marked for staling. Update the local
719 : // preference and update the route accordingly.
720 11431 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
721 11431 : attrs = path->GetAttr();
722 11435 : stale = BgpPath::Stale;
723 11435 : stats_.route_stats[table->family()].staled++;
724 11437 : break;
725 :
726 3234 : case LLGR_STALE:
727 :
728 : // If the path has NO_LLGR community, DELETE it.
729 3234 : if (path->GetAttr()->community() &&
730 0 : path->GetAttr()->community()->ContainsValue(
731 : CommunityType::NoLlgr)) {
732 0 : oper = DBRequest::DB_ENTRY_DELETE;
733 0 : attrs = NULL;
734 0 : stats_.route_stats[table->family()].deleted++;
735 0 : break;
736 : }
737 :
738 : // If path is already marked as llgr_stale, then there is no
739 : // need to process again. This can happen if the session flips
740 : // while in LLGR_TIMER state.
741 3234 : if (path->IsLlgrStale())
742 0 : return false;
743 :
744 3234 : attrs = path->GetAttr();
745 3236 : stale = BgpPath::LlgrStale;
746 3236 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
747 3236 : stats_.route_stats[table->family()].llgr_staled++;
748 3236 : break;
749 : }
750 :
751 : // Feed the route modify/delete request to the table input process.
752 283578 : return table->InputCommon(root, rt, path, peer_close_->peer(), NULL, oper,
753 94526 : attrs, path->GetPathId(), path->GetFlags() | stale, path->GetLabel(),
754 94524 : path->GetL3Label());
755 100712 : }
756 :
757 : //
758 : // Handler for an Event.
759 : //
760 143452 : bool PeerCloseManager::EventCallback(Event *event) {
761 143452 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
762 : bool result;
763 :
764 143452 : switch (event->event_type) {
765 0 : case EVENT_NONE:
766 0 : break;
767 20926 : case CLOSE:
768 20926 : Close(event);
769 20926 : break;
770 14773 : case EOR_RECEIVED:
771 14773 : ProcessEORMarkerReceived(event);
772 14773 : break;
773 20199 : case MEMBERSHIP_REQUEST:
774 20199 : MembershipRequest(event);
775 20199 : break;
776 84721 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
777 84721 : result = MembershipRequestCallback(event);
778 :
779 : // Notify clients if we are no longer using the membership mgr.
780 84721 : if (result)
781 11181 : peer_close_->MembershipRequestCallbackComplete();
782 84721 : break;
783 2833 : case TIMER_CALLBACK:
784 2833 : RestartTimerCallback(event);
785 2833 : break;
786 : }
787 :
788 143452 : delete event;
789 143452 : return true;
790 : }
|