Line data Source code
1 : /*
2 : * Copyright (c) 2013 Juniper Networks, Inc. All rights reserved.
3 : */
4 :
5 : #include "bgp/peer_close_manager.h"
6 :
7 :
8 : #include <list>
9 : #include <map>
10 :
11 : #include <boost/foreach.hpp>
12 :
13 : #include "base/task_annotations.h"
14 : #include "bgp/bgp_log.h"
15 : #include "bgp/bgp_membership.h"
16 : #include "bgp/bgp_peer_types.h"
17 : #include "bgp/bgp_route.h"
18 : #include "bgp/bgp_server.h"
19 : #include "bgp/routing-instance/routing_instance.h"
20 : #include "net/community_type.h"
21 :
22 : #define PEER_CLOSE_MANAGER_LOG(msg) \
23 : BGP_LOG_PEER(Event, peer_close_->peer(), SandeshLevel::SYS_INFO, \
24 : BGP_LOG_FLAG_ALL, BGP_PEER_DIR_NA, \
25 : "PeerCloseManager: State " << GetStateName(state_) << \
26 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
27 : ", MembershipReqPending: " << membership_req_pending_ << \
28 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
29 :
30 : #define PEER_CLOSE_MANAGER_TABLE_LOG(msg) \
31 : BGP_LOG_PEER_TABLE(peer_close_->peer(), SandeshLevel::SYS_INFO, \
32 : BGP_LOG_FLAG_ALL, table, \
33 : "PeerCloseManager: State " << GetStateName(state_) << \
34 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
35 : ", MembershipReqPending: " << membership_req_pending_ << \
36 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
37 :
38 : #define MOVE_TO_STATE(state) \
39 : do { \
40 : assert(state_ != state); \
41 : PEER_CLOSE_MANAGER_LOG("Move to state " << GetStateName(state)); \
42 : state_ = state; \
43 : } while (false)
44 :
45 : // Create an instance of PeerCloseManager with back reference to parent IPeer
46 8064 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close,
47 8064 : boost::asio::io_context *io_service) :
48 8064 : peer_close_(peer_close), gr_timer_(NULL),
49 16128 : event_queue_(new WorkQueue<Event *>(
50 24192 : TaskScheduler::GetInstance()->GetTaskId(
51 8064 : peer_close_->GetTaskName()),
52 8064 : peer_close_->GetTaskInstance(),
53 8064 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
54 8064 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
55 16128 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
56 8064 : stats_.init++;
57 8064 : membership_req_pending_ = 0;
58 8064 : gr_timer_ = TimerManager::CreateTimer(*io_service,
59 : "Graceful Restart Timer");
60 8064 : }
61 :
62 : // Create an instance of PeerCloseManager with back reference to parent IPeer
63 20411 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close) :
64 20411 : peer_close_(peer_close), gr_timer_(NULL),
65 40822 : event_queue_(new WorkQueue<Event *>(
66 61233 : TaskScheduler::GetInstance()->GetTaskId(
67 20411 : peer_close_->GetTaskName()),
68 20411 : peer_close_->GetTaskInstance(),
69 20411 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
70 20411 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
71 40822 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
72 20411 : stats_.init++;
73 20411 : membership_req_pending_ = 0;
74 20411 : if (peer_close->peer() && peer_close->peer()->server()) {
75 16596 : gr_timer_ =
76 16596 : TimerManager::CreateTimer(*peer_close->peer()->server()->ioservice(),
77 : "Graceful Restart Timer");
78 : }
79 20411 : }
80 :
81 45866 : PeerCloseManager::~PeerCloseManager() {
82 28475 : event_queue_->Shutdown();
83 28475 : TimerManager::DeleteTimer(gr_timer_);
84 45866 : }
85 :
86 226080 : std::string PeerCloseManager::GetStateName(State state) const {
87 226080 : switch (state) {
88 32479 : case NONE:
89 32479 : return "NONE";
90 68098 : case GR_TIMER:
91 68098 : return "GR_TIMER";
92 19404 : case STALE:
93 19404 : return "STALE";
94 6051 : case LLGR_STALE:
95 6051 : return "LLGR_STALE";
96 7254 : case LLGR_TIMER:
97 7254 : return "LLGR_TIMER";
98 10469 : case SWEEP:
99 10469 : return "SWEEP";
100 82325 : case DELETE:
101 82325 : return "DELETE";
102 : }
103 0 : assert(false);
104 : return "";
105 : }
106 :
107 204172 : std::string PeerCloseManager::GetMembershipStateName(
108 : MembershipState state) const {
109 204172 : switch (state) {
110 91728 : case MEMBERSHIP_NONE:
111 91728 : return "NONE";
112 108089 : case MEMBERSHIP_IN_USE:
113 108089 : return "IN_USE";
114 4356 : case MEMBERSHIP_IN_WAIT:
115 4356 : return "IN_WAIT";
116 : }
117 0 : assert(false);
118 : return "";
119 : }
120 :
121 53734 : std::string PeerCloseManager::GetEventName(EventType eventType) const {
122 53734 : switch (eventType) {
123 0 : case EVENT_NONE:
124 0 : return "NONE";
125 10127 : case CLOSE:
126 10127 : return "CLOSE";
127 5543 : case EOR_RECEIVED:
128 5543 : return "EOR_RECEIVED";
129 9650 : case MEMBERSHIP_REQUEST:
130 9650 : return "MEMBERSHIP_REQUEST";
131 25639 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
132 25639 : return "MEMBERSHIP_REQUEST_COMPLETE_CALLBACK";
133 2775 : case TIMER_CALLBACK:
134 2775 : return "TIMER_CALLBACK";
135 : }
136 :
137 0 : return "";
138 : }
139 :
140 143483 : void PeerCloseManager::EnqueueEvent(Event *event) {
141 164027 : PEER_CLOSE_MANAGER_LOG("Enqueued event " <<
142 : GetEventName(event->event_type) <<
143 : ", graceful " << event->graceful <<
144 : ", family " << Address::FamilyToString(event->family));
145 143517 : event_queue_->Enqueue(event);
146 143675 : }
147 :
148 : // Trigger closure of an IPeer
149 : //
150 : // Graceful close_state_: NONE
151 : // RibIn Stale Marking and Ribout deletion close_state_: STALE
152 : // StateMachine restart and GR timer start close_state_: GR_TIMER
153 : //
154 : // Peer IsReady() in GR timer callback (or via reception of all EoRs)
155 : // RibIn Sweep and Ribout Generation close_state_: SWEEP
156 : // MembershipRequestCallback close_state_: NONE
157 : //
158 : // Peer not IsReady() in GR timer callback
159 : // If LLGR supported close_state_: LLGR_STALE
160 : // RibIn Stale marking with LLGR_STALE community close_state_: LLGR_TIMER
161 : //
162 : // Peer not IsReady() in LLGR timer callback
163 : // RibIn Delete close_state_: DELETE
164 : // MembershipRequestCallback close_state_: NONE
165 : //
166 : // Peer IsReady() in LLGR timer callback (or via reception of all EoRs)
167 : // RibIn Sweep close_state_: SWEEP
168 : // MembershipRequestCallback close_state_: NONE
169 : //
170 : // If LLGR is not supported
171 : // RibIn Delete close_state_: DELETE
172 : // MembershipRequestCallback close_state_: NONE
173 : //
174 : // Close() call during any state other than NONE and DELETE
175 : // Cancel GR timer and restart GR Closure all over again
176 : //
177 : // NonGraceful close_state_ = * (except DELETE)
178 : // A. RibIn deletion and Ribout deletion close_state_ = DELETE
179 : // B. MembershipRequestCallback => Peers delete/StateMachine restart
180 : // close_state_ = NONE
181 : //
182 : // If Close is restarted, account for GR timer's elapsed time.
183 : //
184 : // Use graceful as true to close gracefully.
185 20908 : void PeerCloseManager::Close(bool graceful) {
186 20908 : EnqueueEvent(new Event(CLOSE, graceful));
187 20914 : }
188 :
189 20914 : void PeerCloseManager::Close(Event *event) {
190 : // Note down non-graceful close trigger. Once non-graceful closure is
191 : // triggered, it should remain so until close process is complete. Further
192 : // graceful closure calls until then should remain non-graceful.
193 20914 : graceful_ &= event->graceful;
194 20914 : CloseInternal();
195 20914 : }
196 :
197 21447 : void PeerCloseManager::CloseInternal() {
198 21447 : stats_.close++;
199 :
200 : // Ignore nested closures
201 21447 : if (close_again_) {
202 4 : PEER_CLOSE_MANAGER_LOG("Nested close calls ignored");
203 4 : return;
204 : }
205 :
206 21443 : switch (state_) {
207 19894 : case NONE:
208 19894 : stats_.ResetRouteStats();
209 19894 : ProcessClosure();
210 19894 : break;
211 :
212 336 : case GR_TIMER:
213 462 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart GR");
214 336 : close_again_ = true;
215 336 : stats_.nested++;
216 336 : gr_elapsed_ += gr_timer_->GetElapsedTime();
217 336 : CloseComplete();
218 336 : break;
219 :
220 196 : case LLGR_TIMER:
221 196 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart LLGR");
222 196 : close_again_ = true;
223 196 : stats_.nested++;
224 196 : llgr_elapsed_ += gr_timer_->GetElapsedTime();
225 196 : CloseComplete();
226 196 : break;
227 :
228 1017 : case STALE:
229 : case LLGR_STALE:
230 : case SWEEP:
231 : case DELETE:
232 1017 : PEER_CLOSE_MANAGER_LOG("Nested close");
233 1017 : close_again_ = true;
234 1017 : stats_.nested++;
235 1017 : break;
236 : }
237 : }
238 :
239 15024 : void PeerCloseManager::ProcessEORMarkerReceived(Address::Family family) {
240 15024 : EnqueueEvent(new Event(EOR_RECEIVED, family));
241 15028 : }
242 :
243 15028 : void PeerCloseManager::ProcessEORMarkerReceived(Event *event) {
244 15028 : if ((state_ == GR_TIMER || state_ == LLGR_TIMER) && !families_.empty()) {
245 1791 : if (event->family == Address::UNSPEC) {
246 40 : families_.clear();
247 : } else {
248 1751 : families_.erase(event->family);
249 : }
250 :
251 : // Start the timer if all EORs have been received.
252 1791 : if (families_.empty())
253 1182 : StartRestartTimer(0);
254 : }
255 15028 : }
256 :
257 : // Process RibIn during peer closure.
258 2594 : void PeerCloseManager::StartRestartTimer(int time) {
259 2594 : gr_timer_->Cancel();
260 2858 : PEER_CLOSE_MANAGER_LOG("GR Timer started to fire after " << time/1000 <<
261 : " seconds");
262 2594 : gr_timer_->Start(time,
263 : boost::bind(&PeerCloseManager::RestartTimerCallback, this));
264 2594 : }
265 :
266 2778 : bool PeerCloseManager::RestartTimerCallback() {
267 2778 : CHECK_CONCURRENCY("timer::TimerTask");
268 2777 : EnqueueEvent(new Event(TIMER_CALLBACK));
269 2779 : return false;
270 : }
271 :
272 2779 : void PeerCloseManager::RestartTimerCallback(Event *event) {
273 2779 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
274 :
275 2889 : PEER_CLOSE_MANAGER_LOG("GR Timer callback started");
276 2779 : if (state_ != GR_TIMER && state_ != LLGR_TIMER)
277 960 : return;
278 :
279 1819 : if (peer_close_->IsReady() && !families_.empty()) {
280 : // Fake reception of all EORs.
281 204 : for (IPeerClose::Families::iterator i = families_.begin(), next = i;
282 408 : i != families_.end(); i = next) {
283 204 : next++;
284 216 : PEER_CLOSE_MANAGER_LOG("Simulate EoR reception for family " << *i);
285 204 : peer_close_->ReceiveEndOfRIB(*i);
286 : }
287 : } else {
288 1615 : ProcessClosure();
289 : }
290 : }
291 :
292 : // Route stale timer callback. If the peer has come back up, sweep routes for
293 : // those address families that are still active. Delete the rest
294 21509 : void PeerCloseManager::ProcessClosure() {
295 : // If the peer is back up and this address family is still supported,
296 : // sweep old paths which may not have come back in the new session
297 21509 : switch (state_) {
298 19894 : case NONE:
299 19894 : if (!graceful_ || !peer_close_->IsCloseGraceful()) {
300 19710 : MOVE_TO_STATE(DELETE);
301 18911 : stats_.deletes++;
302 : } else {
303 1178 : MOVE_TO_STATE(STALE);
304 983 : stats_.stale++;
305 983 : StaleNotify();
306 983 : return;
307 : }
308 18911 : break;
309 1058 : case GR_TIMER:
310 1058 : if (peer_close_->IsReady()) {
311 696 : MOVE_TO_STATE(SWEEP);
312 656 : gr_elapsed_ = 0;
313 656 : llgr_elapsed_ = 0;
314 656 : stats_.sweep++;
315 656 : break;
316 : }
317 402 : if (peer_close_->IsCloseLongLivedGraceful()) {
318 314 : MOVE_TO_STATE(LLGR_STALE);
319 285 : stats_.llgr_stale++;
320 285 : peer_close_->LongLivedGracefulRestartStale();
321 285 : break;
322 : }
323 117 : MOVE_TO_STATE(DELETE);
324 117 : stats_.deletes++;
325 117 : break;
326 :
327 557 : case LLGR_TIMER:
328 557 : if (peer_close_->IsReady()) {
329 315 : MOVE_TO_STATE(SWEEP);
330 315 : gr_elapsed_ = 0;
331 315 : llgr_elapsed_ = 0;
332 315 : stats_.sweep++;
333 315 : break;
334 : }
335 271 : MOVE_TO_STATE(DELETE);
336 242 : stats_.deletes++;
337 242 : break;
338 :
339 0 : case STALE:
340 : case LLGR_STALE:
341 : case SWEEP:
342 : case DELETE:
343 0 : assert(false);
344 : return;
345 : }
346 :
347 20526 : if (state_ == DELETE)
348 19270 : peer_close_->CustomClose();
349 20526 : MembershipRequest();
350 : }
351 :
352 1330 : void PeerCloseManager::CloseComplete() {
353 1496 : MOVE_TO_STATE(NONE);
354 1330 : gr_timer_->Cancel();
355 1330 : families_.clear();
356 1330 : stats_.init++;
357 :
358 : // Nested closures trigger fresh GR
359 1330 : if (close_again_) {
360 533 : close_again_ = false;
361 533 : CloseInternal();
362 : }
363 1330 : }
364 :
365 1373 : bool PeerCloseManager::AssertSweepState(bool do_assert) {
366 1373 : bool check = (state_ == SWEEP);
367 1373 : if (do_assert)
368 605 : assert(check);
369 1373 : return check;
370 : }
371 :
372 95194 : bool PeerCloseManager::AssertMembershipManagerInUse(bool do_assert) {
373 95194 : bool check = false;
374 181717 : check |= (state_ == STALE || state_ == LLGR_STALE || state_ == SWEEP ||
375 86523 : state_ == DELETE);
376 95194 : check |= (membership_state_ == MEMBERSHIP_IN_USE);
377 95194 : check |= (membership_req_pending_ > 0);
378 95194 : if (do_assert)
379 93850 : assert(check);
380 95194 : return check;
381 : }
382 :
383 22942 : bool PeerCloseManager::AssertMembershipState(bool do_assert) {
384 22942 : bool check = (membership_state_ != MEMBERSHIP_IN_USE);
385 22942 : if (do_assert)
386 20287 : assert(check);
387 22942 : return check;
388 : }
389 :
390 21126 : bool PeerCloseManager::AssertMembershipReqCount(bool do_assert) {
391 21126 : bool check = !membership_req_pending_;
392 21126 : if (do_assert)
393 20198 : assert(check);
394 21126 : return check;
395 : }
396 :
397 1373 : void PeerCloseManager::TriggerSweepStateActions() {
398 1373 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
399 1373 : if (!AssertSweepState())
400 576 : return;
401 :
402 : // Notify clients to trigger sweep as appropriate.
403 797 : peer_close_->GracefulRestartSweep();
404 :
405 : // Reset MembershipUse state after client has been notified above.
406 797 : set_membership_state(MEMBERSHIP_NONE);
407 797 : CloseComplete();
408 : }
409 :
410 : // Notify clients about entering Stale event.
411 983 : void PeerCloseManager::StaleNotify() {
412 983 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
413 :
414 983 : peer_close_->GracefulRestartStale();
415 983 : if (!AssertMembershipState())
416 48 : return;
417 935 : MembershipRequest(NULL);
418 : }
419 :
420 19448 : bool PeerCloseManager::CanUseMembershipManager() const {
421 19448 : return peer_close_->peer()->CanUseMembershipManager();
422 : }
423 :
424 20198 : void PeerCloseManager::GetRegisteredRibs(std::list<BgpTable *> *tables) {
425 20198 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
426 20198 : mgr->GetRegisteredRibs(peer_close_->peer(), tables);
427 20198 : }
428 :
429 83430 : bool PeerCloseManager::IsRegistered(BgpTable *table) const {
430 83430 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
431 83430 : return mgr->IsRegistered(peer_close_->peer(), table);
432 : }
433 :
434 73532 : void PeerCloseManager::Unregister(BgpTable *table) {
435 73532 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
436 73532 : mgr->Unregister(peer_close_->peer(), table);
437 73532 : }
438 :
439 3763 : void PeerCloseManager::WalkRibIn(BgpTable *table) {
440 3763 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
441 3763 : mgr->WalkRibIn(peer_close_->peer(), table);
442 3763 : }
443 :
444 4332 : void PeerCloseManager::UnregisterRibOut(BgpTable *table) {
445 4332 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
446 4332 : mgr->UnregisterRibOut(peer_close_->peer(), table);
447 4332 : }
448 :
449 3990 : bool PeerCloseManager::IsRibInRegistered(BgpTable *table) const {
450 3990 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
451 3990 : return mgr->IsRibInRegistered(peer_close_->peer(), table);
452 : }
453 :
454 1803 : void PeerCloseManager::UnregisterRibIn(BgpTable *table) {
455 1803 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
456 1803 : mgr->UnregisterRibIn(peer_close_->peer(), table);
457 1803 : }
458 :
459 21959 : void PeerCloseManager::MembershipRequest() {
460 21959 : if (!AssertMembershipState())
461 848 : return;
462 :
463 : // Pause if membership manager is not ready for usage.
464 21111 : if (!CanUseMembershipManager()) {
465 920 : set_membership_state(MEMBERSHIP_IN_WAIT);
466 993 : PEER_CLOSE_MANAGER_LOG("Wait for membership manager availability");
467 920 : return;
468 : }
469 20191 : set_membership_state(MEMBERSHIP_IN_USE);
470 20191 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST));
471 : }
472 :
473 21126 : void PeerCloseManager::MembershipRequest(Event *evnet) {
474 21126 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
475 :
476 21126 : set_membership_state(MEMBERSHIP_IN_USE);
477 21126 : if (!AssertMembershipReqCount())
478 10868 : return;
479 20678 : membership_req_pending_++;
480 20678 : std::list<BgpTable *> tables;
481 20678 : GetRegisteredRibs(&tables);
482 :
483 20678 : if (tables.empty()) {
484 10420 : assert(MembershipRequestCallback(NULL));
485 10420 : return;
486 : }
487 :
488 : // Account for extra increment above.
489 10258 : membership_req_pending_--;
490 178078 : BOOST_FOREACH(BgpTable *table, tables) {
491 83910 : membership_req_pending_++;
492 83910 : if (IsRegistered(table)) {
493 79682 : if (state_ == PeerCloseManager::DELETE) {
494 100269 : PEER_CLOSE_MANAGER_TABLE_LOG(
495 : "MembershipManager::Unregister");
496 73649 : Unregister(table);
497 6033 : } else if (state_ == PeerCloseManager::SWEEP) {
498 3652 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
499 1637 : WalkRibIn(table);
500 : } else {
501 11606 : PEER_CLOSE_MANAGER_TABLE_LOG(
502 : "MembershipManager::UnregisterRibOut");
503 4396 : UnregisterRibOut(table);
504 : }
505 : } else {
506 4228 : assert(IsRibInRegistered(table));
507 4228 : if (state_ == PeerCloseManager::DELETE) {
508 5027 : PEER_CLOSE_MANAGER_TABLE_LOG(
509 : "MembershipManager::UnregisterRibIn");
510 1918 : UnregisterRibIn(table);
511 : } else {
512 6055 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
513 2310 : WalkRibIn(table);
514 : }
515 : }
516 : }
517 20678 : }
518 :
519 84572 : void PeerCloseManager::MembershipRequestCallback() {
520 84572 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST_COMPLETE_CALLBACK));
521 84762 : }
522 :
523 : // Close process for this peer in terms of walking RibIns and RibOuts are
524 : // complete. Do the final cleanups necessary and notify interested party
525 : //
526 : // Retrun true if we are done using membership manager, false otherwise.
527 95194 : bool PeerCloseManager::MembershipRequestCallback(Event *event) {
528 95194 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
529 :
530 95194 : bool result = false;
531 113784 : PEER_CLOSE_MANAGER_LOG("MembershipRequestCallback");
532 :
533 95194 : if (!AssertMembershipManagerInUse())
534 0 : return result;
535 95194 : if (--membership_req_pending_)
536 73652 : return result;
537 :
538 : // Indicate to the caller that we are done using the membership manager.
539 21542 : result = true;
540 :
541 21542 : if (state_ == DELETE) {
542 19584 : MOVE_TO_STATE(NONE);
543 18756 : peer_close_->Delete();
544 18756 : gr_elapsed_ = 0;
545 18756 : llgr_elapsed_ = 0;
546 18756 : stats_.init++;
547 18756 : close_again_ = false;
548 18756 : graceful_ = true;
549 18756 : set_membership_state(MEMBERSHIP_NONE);
550 18756 : return result;
551 : }
552 :
553 : // Process nested closures.
554 2786 : if (close_again_) {
555 1 : set_membership_state(MEMBERSHIP_NONE);
556 1 : CloseComplete();
557 :
558 : // Nested closure can make membership manager to be in use again.
559 1 : return membership_state_ != MEMBERSHIP_IN_USE;
560 : }
561 :
562 : // If any GR stale timer has to be launched, then to wait for some time
563 : // hoping for the peer (and the paths) to come back up.
564 2785 : if (state_ == STALE) {
565 1031 : peer_close_->CloseComplete();
566 1226 : MOVE_TO_STATE(GR_TIMER);
567 1031 : peer_close_->GetGracefulRestartFamilies(&families_);
568 :
569 : // Offset restart time with elapsed time during nested closures.
570 1031 : int time = peer_close_->GetGracefulRestartTime() * 1000;
571 1031 : time -= gr_elapsed_;
572 1031 : if (time < 0)
573 0 : time = 0;
574 1031 : StartRestartTimer(time);
575 1031 : stats_.gr_timer++;
576 1031 : set_membership_state(MEMBERSHIP_NONE);
577 1031 : return result;
578 : }
579 :
580 : // From LLGR_STALE state, switch to LLGR_TIMER state. Typically this would
581 : // be a very long timer, and we expect to receive EORs before this timer
582 : // expires.
583 : // Just like for GRSTALE in the above case, before moving to LLGR_TIMER and
584 : // starting LLGR_TIMER, we can check if the peer can come back up.
585 1754 : if (state_ == LLGR_STALE) {
586 410 : MOVE_TO_STATE(LLGR_TIMER);
587 381 : peer_close_->CloseComplete();
588 381 : peer_close_->GetLongLivedGracefulRestartFamilies(&families_);
589 :
590 : // Offset restart time with elapsed time during nested closures.
591 381 : int time = peer_close_->GetLongLivedGracefulRestartTime() * 1000;
592 381 : time -= llgr_elapsed_;
593 381 : if (time < 0)
594 0 : time = 0;
595 381 : StartRestartTimer(time);
596 381 : stats_.llgr_timer++;
597 381 : set_membership_state(MEMBERSHIP_NONE);
598 381 : return result;
599 : }
600 :
601 1373 : TriggerSweepStateActions();
602 1373 : return result;
603 : }
604 :
605 63796 : void PeerCloseManager::FillRouteCloseInfo(PeerCloseInfo *close_info) const {
606 63796 : std::map<std::string, PeerCloseRouteInfo> route_stats;
607 :
608 701756 : for (int i = 0; i < Address::NUM_FAMILIES; i++) {
609 637960 : if (!stats_.route_stats[i].IsSet())
610 481016 : continue;
611 156944 : PeerCloseRouteInfo route_info;
612 156944 : route_info.set_staled(stats_.route_stats[i].staled);
613 156944 : route_info.set_llgr_staled(stats_.route_stats[i].llgr_staled);
614 156944 : route_info.set_refreshed(stats_.route_stats[i].refreshed);
615 156944 : route_info.set_fresh(stats_.route_stats[i].fresh);
616 156944 : route_info.set_deleted(stats_.route_stats[i].deleted);
617 156944 : route_stats[Address::FamilyToString(static_cast<Address::Family>(i))] = route_info;
618 156944 : }
619 :
620 63796 : if (!route_stats.empty())
621 62937 : close_info->set_route_stats(route_stats);
622 63796 : }
623 :
624 63796 : BgpNeighborResp *PeerCloseManager::FillCloseInfo(BgpNeighborResp *resp) const {
625 63796 : PeerCloseInfo peer_close_info;
626 63796 : peer_close_info.set_state(GetStateName(state_));
627 63796 : peer_close_info.set_membership_state(
628 127592 : GetMembershipStateName(membership_state_));
629 63796 : peer_close_info.set_close_again(close_again_);
630 63796 : peer_close_info.set_graceful(graceful_);
631 63796 : peer_close_info.set_init(stats_.init);
632 63796 : peer_close_info.set_close(stats_.close);
633 63796 : peer_close_info.set_nested(stats_.nested);
634 63796 : peer_close_info.set_deletes(stats_.deletes);
635 63796 : peer_close_info.set_stale(stats_.stale);
636 63796 : peer_close_info.set_llgr_stale(stats_.llgr_stale);
637 63796 : peer_close_info.set_sweep(stats_.sweep);
638 63796 : peer_close_info.set_gr_timer(stats_.gr_timer);
639 63796 : peer_close_info.set_llgr_timer(stats_.llgr_timer);
640 63796 : FillRouteCloseInfo(&peer_close_info);
641 :
642 63796 : resp->set_peer_close_info(peer_close_info);
643 :
644 63796 : return resp;
645 63796 : }
646 :
647 216366 : void PeerCloseManager::UpdateRouteStats(Address::Family family,
648 : const BgpPath *old_path, uint32_t path_flags) const {
649 216366 : if (state_ == NONE)
650 196667 : return;
651 :
652 19699 : if (!old_path)
653 66 : stats_.route_stats[family].fresh++;
654 19633 : else if (old_path->IsStale() && !(path_flags & BgpPath::Stale))
655 3272 : stats_.route_stats[family].refreshed++;
656 : }
657 :
658 99927 : bool PeerCloseManager::MembershipPathCallback(DBTablePartBase *root,
659 : BgpRoute *rt, BgpPath *path) {
660 99927 : CHECK_CONCURRENCY("db::DBTable");
661 99931 : DBRequest::DBOperation oper = DBRequest::DB_ENTRY_INVALID;
662 99931 : BgpAttrPtr attrs;
663 :
664 99931 : BgpTable *table = static_cast<BgpTable *>(root->parent());
665 99928 : assert(table);
666 :
667 99928 : uint32_t stale = 0;
668 :
669 99928 : switch (state_) {
670 0 : case NONE:
671 : case GR_TIMER:
672 : case LLGR_TIMER:
673 0 : return false;
674 :
675 5948 : case SWEEP:
676 :
677 : // Stale paths must be deleted.
678 5948 : if (!path->IsStale() && !path->IsLlgrStale())
679 2824 : return false;
680 3124 : if (path->IsStale()) {
681 3124 : path->ResetStale();
682 3124 : table->UpdateStalePathCount(-1);
683 : }
684 3126 : if (path->IsLlgrStale()) {
685 22 : path->ResetLlgrStale();
686 22 : table->UpdateLlgrStalePathCount(-1);
687 : }
688 3126 : oper = DBRequest::DB_ENTRY_DELETE;
689 3126 : attrs = NULL;
690 3126 : stats_.route_stats[table->family()].deleted++;
691 3126 : break;
692 :
693 76051 : case DELETE:
694 :
695 : // This path must be deleted. Hence attr is not required.
696 76051 : oper = DBRequest::DB_ENTRY_DELETE;
697 76051 : attrs = NULL;
698 76056 : stats_.route_stats[table->family()].deleted++;
699 76088 : break;
700 :
701 14665 : case STALE:
702 :
703 : // We do not support GR for multicast routes (yet).
704 29328 : if ((table->family() == Address::ERMVPN) ||
705 14664 : (table->family() == Address::MVPN)) {
706 0 : oper = DBRequest::DB_ENTRY_DELETE;
707 0 : attrs = NULL;
708 0 : stats_.route_stats[table->family()].deleted++;
709 0 : break;
710 : }
711 :
712 : // If path is already marked as stale, then there is no need to
713 : // process again. This can happen if the session flips while in
714 : // GR_TIMER state.
715 14662 : if (path->IsStale())
716 3341 : return false;
717 :
718 : // This path must be marked for staling. Update the local
719 : // preference and update the route accordingly.
720 11321 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
721 11321 : attrs = path->GetAttr();
722 11328 : stale = BgpPath::Stale;
723 11328 : stats_.route_stats[table->family()].staled++;
724 11332 : break;
725 :
726 3265 : case LLGR_STALE:
727 :
728 : // If the path has NO_LLGR community, DELETE it.
729 3265 : if (path->GetAttr()->community() &&
730 0 : path->GetAttr()->community()->ContainsValue(
731 : CommunityType::NoLlgr)) {
732 0 : oper = DBRequest::DB_ENTRY_DELETE;
733 0 : attrs = NULL;
734 0 : stats_.route_stats[table->family()].deleted++;
735 0 : break;
736 : }
737 :
738 : // If path is already marked as llgr_stale, then there is no
739 : // need to process again. This can happen if the session flips
740 : // while in LLGR_TIMER state.
741 3265 : if (path->IsLlgrStale())
742 0 : return false;
743 :
744 3266 : attrs = path->GetAttr();
745 3267 : stale = BgpPath::LlgrStale;
746 3267 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
747 3267 : stats_.route_stats[table->family()].llgr_staled++;
748 3270 : break;
749 : }
750 :
751 : // Feed the route modify/delete request to the table input process.
752 281420 : return table->InputCommon(root, rt, path, peer_close_->peer(), NULL, oper,
753 93804 : attrs, path->GetPathId(), path->GetFlags() | stale, path->GetLabel(),
754 93804 : path->GetL3Label());
755 99966 : }
756 :
757 : //
758 : // Handler for an Event.
759 : //
760 143686 : bool PeerCloseManager::EventCallback(Event *event) {
761 143686 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
762 : bool result;
763 :
764 143686 : switch (event->event_type) {
765 0 : case EVENT_NONE:
766 0 : break;
767 20914 : case CLOSE:
768 20914 : Close(event);
769 20914 : break;
770 15028 : case EOR_RECEIVED:
771 15028 : ProcessEORMarkerReceived(event);
772 15028 : break;
773 20191 : case MEMBERSHIP_REQUEST:
774 20191 : MembershipRequest(event);
775 20191 : break;
776 84774 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
777 84774 : result = MembershipRequestCallback(event);
778 :
779 : // Notify clients if we are no longer using the membership mgr.
780 84774 : if (result)
781 11121 : peer_close_->MembershipRequestCallbackComplete();
782 84774 : break;
783 2779 : case TIMER_CALLBACK:
784 2779 : RestartTimerCallback(event);
785 2779 : break;
786 : }
787 :
788 143686 : delete event;
789 143686 : return true;
790 : }
|