Line data Source code
1 : /*
2 : * Copyright (c) 2013 Juniper Networks, Inc. All rights reserved.
3 : */
4 :
5 : #include "bgp/peer_close_manager.h"
6 :
7 :
8 : #include <list>
9 : #include <map>
10 :
11 : #include <boost/foreach.hpp>
12 :
13 : #include "base/task_annotations.h"
14 : #include "bgp/bgp_log.h"
15 : #include "bgp/bgp_membership.h"
16 : #include "bgp/bgp_peer_types.h"
17 : #include "bgp/bgp_route.h"
18 : #include "bgp/bgp_server.h"
19 : #include "bgp/routing-instance/routing_instance.h"
20 : #include "net/community_type.h"
21 :
22 : #define PEER_CLOSE_MANAGER_LOG(msg) \
23 : BGP_LOG_PEER(Event, peer_close_->peer(), SandeshLevel::SYS_INFO, \
24 : BGP_LOG_FLAG_ALL, BGP_PEER_DIR_NA, \
25 : "PeerCloseManager: State " << GetStateName(state_) << \
26 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
27 : ", MembershipReqPending: " << membership_req_pending_ << \
28 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
29 :
30 : #define PEER_CLOSE_MANAGER_TABLE_LOG(msg) \
31 : BGP_LOG_PEER_TABLE(peer_close_->peer(), SandeshLevel::SYS_INFO, \
32 : BGP_LOG_FLAG_ALL, table, \
33 : "PeerCloseManager: State " << GetStateName(state_) << \
34 : ", MembershipState: " << GetMembershipStateName(membership_state_) << \
35 : ", MembershipReqPending: " << membership_req_pending_ << \
36 : ", CloseAgain?: " << (close_again_ ? "Yes" : "No") << ": " << msg);
37 :
38 : #define MOVE_TO_STATE(state) \
39 : do { \
40 : assert(state_ != state); \
41 : PEER_CLOSE_MANAGER_LOG("Move to state " << GetStateName(state)); \
42 : state_ = state; \
43 : } while (false)
44 :
45 : // Create an instance of PeerCloseManager with back reference to parent IPeer
46 8064 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close,
47 8064 : boost::asio::io_context *io_service) :
48 8064 : peer_close_(peer_close), gr_timer_(NULL),
49 16128 : event_queue_(new WorkQueue<Event *>(
50 24192 : TaskScheduler::GetInstance()->GetTaskId(
51 8064 : peer_close_->GetTaskName()),
52 8064 : peer_close_->GetTaskInstance(),
53 8064 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
54 8064 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
55 16128 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
56 8064 : stats_.init++;
57 8064 : membership_req_pending_ = 0;
58 8064 : gr_timer_ = TimerManager::CreateTimer(*io_service,
59 : "Graceful Restart Timer");
60 8064 : }
61 :
62 : // Create an instance of PeerCloseManager with back reference to parent IPeer
63 20401 : PeerCloseManager::PeerCloseManager(IPeerClose *peer_close) :
64 20401 : peer_close_(peer_close), gr_timer_(NULL),
65 40804 : event_queue_(new WorkQueue<Event *>(
66 61206 : TaskScheduler::GetInstance()->GetTaskId(
67 20402 : peer_close_->GetTaskName()),
68 20402 : peer_close_->GetTaskInstance(),
69 20402 : boost::bind(&PeerCloseManager::EventCallback, this, _1))),
70 20402 : state_(NONE), close_again_(false), graceful_(true), gr_elapsed_(0),
71 40803 : llgr_elapsed_(0), membership_state_(MEMBERSHIP_NONE) {
72 20402 : stats_.init++;
73 20402 : membership_req_pending_ = 0;
74 20402 : if (peer_close->peer() && peer_close->peer()->server()) {
75 16587 : gr_timer_ =
76 16587 : TimerManager::CreateTimer(*peer_close->peer()->server()->ioservice(),
77 : "Graceful Restart Timer");
78 : }
79 20402 : }
80 :
81 45853 : PeerCloseManager::~PeerCloseManager() {
82 28466 : event_queue_->Shutdown();
83 28466 : TimerManager::DeleteTimer(gr_timer_);
84 45853 : }
85 :
86 226530 : std::string PeerCloseManager::GetStateName(State state) const {
87 226530 : switch (state) {
88 32581 : case NONE:
89 32581 : return "NONE";
90 68887 : case GR_TIMER:
91 68887 : return "GR_TIMER";
92 19502 : case STALE:
93 19502 : return "STALE";
94 5902 : case LLGR_STALE:
95 5902 : return "LLGR_STALE";
96 6630 : case LLGR_TIMER:
97 6630 : return "LLGR_TIMER";
98 10790 : case SWEEP:
99 10790 : return "SWEEP";
100 82238 : case DELETE:
101 82238 : return "DELETE";
102 : }
103 0 : assert(false);
104 : return "";
105 : }
106 :
107 204399 : std::string PeerCloseManager::GetMembershipStateName(
108 : MembershipState state) const {
109 204399 : switch (state) {
110 91861 : case MEMBERSHIP_NONE:
111 91861 : return "NONE";
112 108177 : case MEMBERSHIP_IN_USE:
113 108177 : return "IN_USE";
114 4361 : case MEMBERSHIP_IN_WAIT:
115 4361 : return "IN_WAIT";
116 : }
117 0 : assert(false);
118 : return "";
119 : }
120 :
121 53991 : std::string PeerCloseManager::GetEventName(EventType eventType) const {
122 53991 : switch (eventType) {
123 0 : case EVENT_NONE:
124 0 : return "NONE";
125 10176 : case CLOSE:
126 10176 : return "CLOSE";
127 5553 : case EOR_RECEIVED:
128 5553 : return "EOR_RECEIVED";
129 9705 : case MEMBERSHIP_REQUEST:
130 9705 : return "MEMBERSHIP_REQUEST";
131 25711 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
132 25711 : return "MEMBERSHIP_REQUEST_COMPLETE_CALLBACK";
133 2846 : case TIMER_CALLBACK:
134 2846 : return "TIMER_CALLBACK";
135 : }
136 :
137 0 : return "";
138 : }
139 :
140 143329 : void PeerCloseManager::EnqueueEvent(Event *event) {
141 163877 : PEER_CLOSE_MANAGER_LOG("Enqueued event " <<
142 : GetEventName(event->event_type) <<
143 : ", graceful " << event->graceful <<
144 : ", family " << Address::FamilyToString(event->family));
145 143360 : event_queue_->Enqueue(event);
146 143543 : }
147 :
148 : // Trigger closure of an IPeer
149 : //
150 : // Graceful close_state_: NONE
151 : // RibIn Stale Marking and Ribout deletion close_state_: STALE
152 : // StateMachine restart and GR timer start close_state_: GR_TIMER
153 : //
154 : // Peer IsReady() in GR timer callback (or via reception of all EoRs)
155 : // RibIn Sweep and Ribout Generation close_state_: SWEEP
156 : // MembershipRequestCallback close_state_: NONE
157 : //
158 : // Peer not IsReady() in GR timer callback
159 : // If LLGR supported close_state_: LLGR_STALE
160 : // RibIn Stale marking with LLGR_STALE community close_state_: LLGR_TIMER
161 : //
162 : // Peer not IsReady() in LLGR timer callback
163 : // RibIn Delete close_state_: DELETE
164 : // MembershipRequestCallback close_state_: NONE
165 : //
166 : // Peer IsReady() in LLGR timer callback (or via reception of all EoRs)
167 : // RibIn Sweep close_state_: SWEEP
168 : // MembershipRequestCallback close_state_: NONE
169 : //
170 : // If LLGR is not supported
171 : // RibIn Delete close_state_: DELETE
172 : // MembershipRequestCallback close_state_: NONE
173 : //
174 : // Close() call during any state other than NONE and DELETE
175 : // Cancel GR timer and restart GR Closure all over again
176 : //
177 : // NonGraceful close_state_ = * (except DELETE)
178 : // A. RibIn deletion and Ribout deletion close_state_ = DELETE
179 : // B. MembershipRequestCallback => Peers delete/StateMachine restart
180 : // close_state_ = NONE
181 : //
182 : // If Close is restarted, account for GR timer's elapsed time.
183 : //
184 : // Use graceful as true to close gracefully.
185 20924 : void PeerCloseManager::Close(bool graceful) {
186 20924 : EnqueueEvent(new Event(CLOSE, graceful));
187 20925 : }
188 :
189 20925 : void PeerCloseManager::Close(Event *event) {
190 : // Note down non-graceful close trigger. Once non-graceful closure is
191 : // triggered, it should remain so until close process is complete. Further
192 : // graceful closure calls until then should remain non-graceful.
193 20925 : graceful_ &= event->graceful;
194 20925 : CloseInternal();
195 20925 : }
196 :
197 21458 : void PeerCloseManager::CloseInternal() {
198 21458 : stats_.close++;
199 :
200 : // Ignore nested closures
201 21458 : if (close_again_) {
202 4 : PEER_CLOSE_MANAGER_LOG("Nested close calls ignored");
203 4 : return;
204 : }
205 :
206 21454 : switch (state_) {
207 19914 : case NONE:
208 19914 : stats_.ResetRouteStats();
209 19914 : ProcessClosure();
210 19914 : break;
211 :
212 337 : case GR_TIMER:
213 463 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart GR");
214 337 : close_again_ = true;
215 337 : stats_.nested++;
216 337 : gr_elapsed_ += gr_timer_->GetElapsedTime();
217 337 : CloseComplete();
218 337 : break;
219 :
220 196 : case LLGR_TIMER:
221 196 : PEER_CLOSE_MANAGER_LOG("Nested close: Restart LLGR");
222 196 : close_again_ = true;
223 196 : stats_.nested++;
224 196 : llgr_elapsed_ += gr_timer_->GetElapsedTime();
225 196 : CloseComplete();
226 196 : break;
227 :
228 1007 : case STALE:
229 : case LLGR_STALE:
230 : case SWEEP:
231 : case DELETE:
232 1007 : PEER_CLOSE_MANAGER_LOG("Nested close");
233 1007 : close_again_ = true;
234 1007 : stats_.nested++;
235 1007 : break;
236 : }
237 : }
238 :
239 14829 : void PeerCloseManager::ProcessEORMarkerReceived(Address::Family family) {
240 14829 : EnqueueEvent(new Event(EOR_RECEIVED, family));
241 14833 : }
242 :
243 14834 : void PeerCloseManager::ProcessEORMarkerReceived(Event *event) {
244 14834 : if ((state_ == GR_TIMER || state_ == LLGR_TIMER) && !families_.empty()) {
245 1843 : if (event->family == Address::UNSPEC) {
246 40 : families_.clear();
247 : } else {
248 1803 : families_.erase(event->family);
249 : }
250 :
251 : // Start the timer if all EORs have been received.
252 1843 : if (families_.empty())
253 1234 : StartRestartTimer(0);
254 : }
255 14834 : }
256 :
257 : // Process RibIn during peer closure.
258 2700 : void PeerCloseManager::StartRestartTimer(int time) {
259 2700 : gr_timer_->Cancel();
260 2964 : PEER_CLOSE_MANAGER_LOG("GR Timer started to fire after " << time/1000 <<
261 : " seconds");
262 2700 : gr_timer_->Start(time,
263 : boost::bind(&PeerCloseManager::RestartTimerCallback, this));
264 2700 : }
265 :
266 2849 : bool PeerCloseManager::RestartTimerCallback() {
267 2849 : CHECK_CONCURRENCY("timer::TimerTask");
268 2847 : EnqueueEvent(new Event(TIMER_CALLBACK));
269 2849 : return false;
270 : }
271 :
272 2850 : void PeerCloseManager::RestartTimerCallback(Event *event) {
273 2850 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
274 :
275 2960 : PEER_CLOSE_MANAGER_LOG("GR Timer callback started");
276 2850 : if (state_ != GR_TIMER && state_ != LLGR_TIMER)
277 960 : return;
278 :
279 1890 : if (peer_close_->IsReady() && !families_.empty()) {
280 : // Fake reception of all EORs.
281 204 : for (IPeerClose::Families::iterator i = families_.begin(), next = i;
282 408 : i != families_.end(); i = next) {
283 204 : next++;
284 216 : PEER_CLOSE_MANAGER_LOG("Simulate EoR reception for family " << *i);
285 204 : peer_close_->ReceiveEndOfRIB(*i);
286 : }
287 : } else {
288 1686 : ProcessClosure();
289 : }
290 : }
291 :
292 : // Route stale timer callback. If the peer has come back up, sweep routes for
293 : // those address families that are still active. Delete the rest
294 21600 : void PeerCloseManager::ProcessClosure() {
295 : // If the peer is back up and this address family is still supported,
296 : // sweep old paths which may not have come back in the new session
297 21600 : switch (state_) {
298 19914 : case NONE:
299 19914 : if (!graceful_ || !peer_close_->IsCloseGraceful()) {
300 19678 : MOVE_TO_STATE(DELETE);
301 18879 : stats_.deletes++;
302 : } else {
303 1230 : MOVE_TO_STATE(STALE);
304 1035 : stats_.stale++;
305 1035 : StaleNotify();
306 1035 : return;
307 : }
308 18879 : break;
309 1121 : case GR_TIMER:
310 1121 : if (peer_close_->IsReady()) {
311 757 : MOVE_TO_STATE(SWEEP);
312 717 : gr_elapsed_ = 0;
313 717 : llgr_elapsed_ = 0;
314 717 : stats_.sweep++;
315 717 : break;
316 : }
317 404 : if (peer_close_->IsCloseLongLivedGraceful()) {
318 312 : MOVE_TO_STATE(LLGR_STALE);
319 283 : stats_.llgr_stale++;
320 283 : peer_close_->LongLivedGracefulRestartStale();
321 283 : break;
322 : }
323 121 : MOVE_TO_STATE(DELETE);
324 121 : stats_.deletes++;
325 121 : break;
326 :
327 565 : case LLGR_TIMER:
328 565 : if (peer_close_->IsReady()) {
329 317 : MOVE_TO_STATE(SWEEP);
330 317 : gr_elapsed_ = 0;
331 317 : llgr_elapsed_ = 0;
332 317 : stats_.sweep++;
333 317 : break;
334 : }
335 277 : MOVE_TO_STATE(DELETE);
336 248 : stats_.deletes++;
337 248 : break;
338 :
339 0 : case STALE:
340 : case LLGR_STALE:
341 : case SWEEP:
342 : case DELETE:
343 0 : assert(false);
344 : return;
345 : }
346 :
347 20565 : if (state_ == DELETE)
348 19248 : peer_close_->CustomClose();
349 20565 : MembershipRequest();
350 : }
351 :
352 1382 : void PeerCloseManager::CloseComplete() {
353 1548 : MOVE_TO_STATE(NONE);
354 1382 : gr_timer_->Cancel();
355 1382 : families_.clear();
356 1382 : stats_.init++;
357 :
358 : // Nested closures trigger fresh GR
359 1382 : if (close_again_) {
360 533 : close_again_ = false;
361 533 : CloseInternal();
362 : }
363 1382 : }
364 :
365 1425 : bool PeerCloseManager::AssertSweepState(bool do_assert) {
366 1425 : bool check = (state_ == SWEEP);
367 1425 : if (do_assert)
368 657 : assert(check);
369 1425 : return check;
370 : }
371 :
372 95152 : bool PeerCloseManager::AssertMembershipManagerInUse(bool do_assert) {
373 95152 : bool check = false;
374 181526 : check |= (state_ == STALE || state_ == LLGR_STALE || state_ == SWEEP ||
375 86374 : state_ == DELETE);
376 95152 : check |= (membership_state_ == MEMBERSHIP_IN_USE);
377 95152 : check |= (membership_req_pending_ > 0);
378 95152 : if (do_assert)
379 93808 : assert(check);
380 95152 : return check;
381 : }
382 :
383 22997 : bool PeerCloseManager::AssertMembershipState(bool do_assert) {
384 22997 : bool check = (membership_state_ != MEMBERSHIP_IN_USE);
385 22997 : if (do_assert)
386 20324 : assert(check);
387 22997 : return check;
388 : }
389 :
390 21204 : bool PeerCloseManager::AssertMembershipReqCount(bool do_assert) {
391 21204 : bool check = !membership_req_pending_;
392 21204 : if (do_assert)
393 20271 : assert(check);
394 21204 : return check;
395 : }
396 :
397 1425 : void PeerCloseManager::TriggerSweepStateActions() {
398 1425 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
399 1425 : if (!AssertSweepState())
400 576 : return;
401 :
402 : // Notify clients to trigger sweep as appropriate.
403 849 : peer_close_->GracefulRestartSweep();
404 :
405 : // Reset MembershipUse state after client has been notified above.
406 849 : set_membership_state(MEMBERSHIP_NONE);
407 849 : CloseComplete();
408 : }
409 :
410 : // Notify clients about entering Stale event.
411 1035 : void PeerCloseManager::StaleNotify() {
412 1035 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
413 :
414 1035 : peer_close_->GracefulRestartStale();
415 1035 : if (!AssertMembershipState())
416 48 : return;
417 987 : MembershipRequest(NULL);
418 : }
419 :
420 19433 : bool PeerCloseManager::CanUseMembershipManager() const {
421 19433 : return peer_close_->peer()->CanUseMembershipManager();
422 : }
423 :
424 20271 : void PeerCloseManager::GetRegisteredRibs(std::list<BgpTable *> *tables) {
425 20271 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
426 20271 : mgr->GetRegisteredRibs(peer_close_->peer(), tables);
427 20271 : }
428 :
429 83389 : bool PeerCloseManager::IsRegistered(BgpTable *table) const {
430 83389 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
431 83389 : return mgr->IsRegistered(peer_close_->peer(), table);
432 : }
433 :
434 73386 : void PeerCloseManager::Unregister(BgpTable *table) {
435 73386 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
436 73386 : mgr->Unregister(peer_close_->peer(), table);
437 73386 : }
438 :
439 3818 : void PeerCloseManager::WalkRibIn(BgpTable *table) {
440 3818 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
441 3818 : mgr->WalkRibIn(peer_close_->peer(), table);
442 3818 : }
443 :
444 4384 : void PeerCloseManager::UnregisterRibOut(BgpTable *table) {
445 4384 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
446 4384 : mgr->UnregisterRibOut(peer_close_->peer(), table);
447 4384 : }
448 :
449 4010 : bool PeerCloseManager::IsRibInRegistered(BgpTable *table) const {
450 4010 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
451 4010 : return mgr->IsRibInRegistered(peer_close_->peer(), table);
452 : }
453 :
454 1801 : void PeerCloseManager::UnregisterRibIn(BgpTable *table) {
455 1801 : BgpMembershipManager *mgr = peer_close_->peer()->server()->membership_mgr();
456 1801 : mgr->UnregisterRibIn(peer_close_->peer(), table);
457 1801 : }
458 :
459 21962 : void PeerCloseManager::MembershipRequest() {
460 21962 : if (!AssertMembershipState())
461 848 : return;
462 :
463 : // Pause if membership manager is not ready for usage.
464 21114 : if (!CanUseMembershipManager()) {
465 897 : set_membership_state(MEMBERSHIP_IN_WAIT);
466 933 : PEER_CLOSE_MANAGER_LOG("Wait for membership manager availability");
467 897 : return;
468 : }
469 20217 : set_membership_state(MEMBERSHIP_IN_USE);
470 20217 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST));
471 : }
472 :
473 21204 : void PeerCloseManager::MembershipRequest(Event *evnet) {
474 21204 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
475 :
476 21204 : set_membership_state(MEMBERSHIP_IN_USE);
477 21204 : if (!AssertMembershipReqCount())
478 10867 : return;
479 20756 : membership_req_pending_++;
480 20756 : std::list<BgpTable *> tables;
481 20756 : GetRegisteredRibs(&tables);
482 :
483 20756 : if (tables.empty()) {
484 10419 : assert(MembershipRequestCallback(NULL));
485 10419 : return;
486 : }
487 :
488 : // Account for extra increment above.
489 10337 : membership_req_pending_--;
490 178085 : BOOST_FOREACH(BgpTable *table, tables) {
491 83874 : membership_req_pending_++;
492 83874 : if (IsRegistered(table)) {
493 79623 : if (state_ == PeerCloseManager::DELETE) {
494 100113 : PEER_CLOSE_MANAGER_TABLE_LOG(
495 : "MembershipManager::Unregister");
496 73505 : Unregister(table);
497 6118 : } else if (state_ == PeerCloseManager::SWEEP) {
498 3696 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
499 1671 : WalkRibIn(table);
500 : } else {
501 11709 : PEER_CLOSE_MANAGER_TABLE_LOG(
502 : "MembershipManager::UnregisterRibOut");
503 4447 : UnregisterRibOut(table);
504 : }
505 : } else {
506 4251 : assert(IsRibInRegistered(table));
507 4251 : if (state_ == PeerCloseManager::DELETE) {
508 5027 : PEER_CLOSE_MANAGER_TABLE_LOG(
509 : "MembershipManager::UnregisterRibIn");
510 1918 : UnregisterRibIn(table);
511 : } else {
512 6123 : PEER_CLOSE_MANAGER_TABLE_LOG("MembershipManager::WalkRibIn");
513 2333 : WalkRibIn(table);
514 : }
515 : }
516 : }
517 20756 : }
518 :
519 84505 : void PeerCloseManager::MembershipRequestCallback() {
520 84505 : EnqueueEvent(new Event(MEMBERSHIP_REQUEST_COMPLETE_CALLBACK));
521 84721 : }
522 :
523 : // Close process for this peer in terms of walking RibIns and RibOuts are
524 : // complete. Do the final cleanups necessary and notify interested party
525 : //
526 : // Retrun true if we are done using membership manager, false otherwise.
527 95152 : bool PeerCloseManager::MembershipRequestCallback(Event *event) {
528 95152 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
529 :
530 95152 : bool result = false;
531 113763 : PEER_CLOSE_MANAGER_LOG("MembershipRequestCallback");
532 :
533 95152 : if (!AssertMembershipManagerInUse())
534 0 : return result;
535 95152 : if (--membership_req_pending_)
536 73537 : return result;
537 :
538 : // Indicate to the caller that we are done using the membership manager.
539 21615 : result = true;
540 :
541 21615 : if (state_ == DELETE) {
542 19552 : MOVE_TO_STATE(NONE);
543 18724 : peer_close_->Delete();
544 18724 : gr_elapsed_ = 0;
545 18724 : llgr_elapsed_ = 0;
546 18724 : stats_.init++;
547 18724 : close_again_ = false;
548 18724 : graceful_ = true;
549 18724 : set_membership_state(MEMBERSHIP_NONE);
550 18724 : return result;
551 : }
552 :
553 : // Process nested closures.
554 2891 : if (close_again_) {
555 0 : set_membership_state(MEMBERSHIP_NONE);
556 0 : CloseComplete();
557 :
558 : // Nested closure can make membership manager to be in use again.
559 0 : return membership_state_ != MEMBERSHIP_IN_USE;
560 : }
561 :
562 : // If any GR stale timer has to be launched, then to wait for some time
563 : // hoping for the peer (and the paths) to come back up.
564 2891 : if (state_ == STALE) {
565 1083 : peer_close_->CloseComplete();
566 1278 : MOVE_TO_STATE(GR_TIMER);
567 1083 : peer_close_->GetGracefulRestartFamilies(&families_);
568 :
569 : // Offset restart time with elapsed time during nested closures.
570 1083 : int time = peer_close_->GetGracefulRestartTime() * 1000;
571 1083 : time -= gr_elapsed_;
572 1083 : if (time < 0)
573 0 : time = 0;
574 1083 : StartRestartTimer(time);
575 1083 : stats_.gr_timer++;
576 1083 : set_membership_state(MEMBERSHIP_NONE);
577 1083 : return result;
578 : }
579 :
580 : // From LLGR_STALE state, switch to LLGR_TIMER state. Typically this would
581 : // be a very long timer, and we expect to receive EORs before this timer
582 : // expires.
583 : // Just like for GRSTALE in the above case, before moving to LLGR_TIMER and
584 : // starting LLGR_TIMER, we can check if the peer can come back up.
585 1808 : if (state_ == LLGR_STALE) {
586 412 : MOVE_TO_STATE(LLGR_TIMER);
587 383 : peer_close_->CloseComplete();
588 383 : peer_close_->GetLongLivedGracefulRestartFamilies(&families_);
589 :
590 : // Offset restart time with elapsed time during nested closures.
591 383 : int time = peer_close_->GetLongLivedGracefulRestartTime() * 1000;
592 383 : time -= llgr_elapsed_;
593 383 : if (time < 0)
594 0 : time = 0;
595 383 : StartRestartTimer(time);
596 383 : stats_.llgr_timer++;
597 383 : set_membership_state(MEMBERSHIP_NONE);
598 383 : return result;
599 : }
600 :
601 1425 : TriggerSweepStateActions();
602 1425 : return result;
603 : }
604 :
605 63237 : void PeerCloseManager::FillRouteCloseInfo(PeerCloseInfo *close_info) const {
606 63237 : std::map<std::string, PeerCloseRouteInfo> route_stats;
607 :
608 695607 : for (int i = 0; i < Address::NUM_FAMILIES; i++) {
609 632370 : if (!stats_.route_stats[i].IsSet())
610 476847 : continue;
611 155523 : PeerCloseRouteInfo route_info;
612 155523 : route_info.set_staled(stats_.route_stats[i].staled);
613 155523 : route_info.set_llgr_staled(stats_.route_stats[i].llgr_staled);
614 155523 : route_info.set_refreshed(stats_.route_stats[i].refreshed);
615 155523 : route_info.set_fresh(stats_.route_stats[i].fresh);
616 155523 : route_info.set_deleted(stats_.route_stats[i].deleted);
617 155523 : route_stats[Address::FamilyToString(static_cast<Address::Family>(i))] = route_info;
618 155523 : }
619 :
620 63237 : if (!route_stats.empty())
621 62359 : close_info->set_route_stats(route_stats);
622 63237 : }
623 :
624 63237 : BgpNeighborResp *PeerCloseManager::FillCloseInfo(BgpNeighborResp *resp) const {
625 63237 : PeerCloseInfo peer_close_info;
626 63237 : peer_close_info.set_state(GetStateName(state_));
627 63237 : peer_close_info.set_membership_state(
628 126474 : GetMembershipStateName(membership_state_));
629 63237 : peer_close_info.set_close_again(close_again_);
630 63237 : peer_close_info.set_graceful(graceful_);
631 63237 : peer_close_info.set_init(stats_.init);
632 63237 : peer_close_info.set_close(stats_.close);
633 63237 : peer_close_info.set_nested(stats_.nested);
634 63237 : peer_close_info.set_deletes(stats_.deletes);
635 63237 : peer_close_info.set_stale(stats_.stale);
636 63237 : peer_close_info.set_llgr_stale(stats_.llgr_stale);
637 63237 : peer_close_info.set_sweep(stats_.sweep);
638 63237 : peer_close_info.set_gr_timer(stats_.gr_timer);
639 63237 : peer_close_info.set_llgr_timer(stats_.llgr_timer);
640 63237 : FillRouteCloseInfo(&peer_close_info);
641 :
642 63237 : resp->set_peer_close_info(peer_close_info);
643 :
644 63237 : return resp;
645 63237 : }
646 :
647 216673 : void PeerCloseManager::UpdateRouteStats(Address::Family family,
648 : const BgpPath *old_path, uint32_t path_flags) const {
649 216673 : if (state_ == NONE)
650 196760 : return;
651 :
652 19913 : if (!old_path)
653 51 : stats_.route_stats[family].fresh++;
654 19862 : else if (old_path->IsStale() && !(path_flags & BgpPath::Stale))
655 3408 : stats_.route_stats[family].refreshed++;
656 : }
657 :
658 100736 : bool PeerCloseManager::MembershipPathCallback(DBTablePartBase *root,
659 : BgpRoute *rt, BgpPath *path) {
660 100736 : CHECK_CONCURRENCY("db::DBTable");
661 100742 : DBRequest::DBOperation oper = DBRequest::DB_ENTRY_INVALID;
662 100742 : BgpAttrPtr attrs;
663 :
664 100742 : BgpTable *table = static_cast<BgpTable *>(root->parent());
665 100741 : assert(table);
666 :
667 100741 : uint32_t stale = 0;
668 :
669 100741 : switch (state_) {
670 0 : case NONE:
671 : case GR_TIMER:
672 : case LLGR_TIMER:
673 0 : return false;
674 :
675 6026 : case SWEEP:
676 :
677 : // Stale paths must be deleted.
678 6026 : if (!path->IsStale() && !path->IsLlgrStale())
679 2907 : return false;
680 3120 : if (path->IsStale()) {
681 3120 : path->ResetStale();
682 3121 : table->UpdateStalePathCount(-1);
683 : }
684 3123 : if (path->IsLlgrStale()) {
685 0 : path->ResetLlgrStale();
686 0 : table->UpdateLlgrStalePathCount(-1);
687 : }
688 3121 : oper = DBRequest::DB_ENTRY_DELETE;
689 3121 : attrs = NULL;
690 3121 : stats_.route_stats[table->family()].deleted++;
691 3123 : break;
692 :
693 76745 : case DELETE:
694 :
695 : // This path must be deleted. Hence attr is not required.
696 76745 : oper = DBRequest::DB_ENTRY_DELETE;
697 76745 : attrs = NULL;
698 76744 : stats_.route_stats[table->family()].deleted++;
699 76776 : break;
700 :
701 14739 : case STALE:
702 :
703 : // We do not support GR for multicast routes (yet).
704 29476 : if ((table->family() == Address::ERMVPN) ||
705 14738 : (table->family() == Address::MVPN)) {
706 0 : oper = DBRequest::DB_ENTRY_DELETE;
707 0 : attrs = NULL;
708 0 : stats_.route_stats[table->family()].deleted++;
709 0 : break;
710 : }
711 :
712 : // If path is already marked as stale, then there is no need to
713 : // process again. This can happen if the session flips while in
714 : // GR_TIMER state.
715 14737 : if (path->IsStale())
716 3275 : return false;
717 :
718 : // This path must be marked for staling. Update the local
719 : // preference and update the route accordingly.
720 11462 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
721 11462 : attrs = path->GetAttr();
722 11465 : stale = BgpPath::Stale;
723 11465 : stats_.route_stats[table->family()].staled++;
724 11465 : break;
725 :
726 3233 : case LLGR_STALE:
727 :
728 : // If the path has NO_LLGR community, DELETE it.
729 3233 : if (path->GetAttr()->community() &&
730 0 : path->GetAttr()->community()->ContainsValue(
731 : CommunityType::NoLlgr)) {
732 0 : oper = DBRequest::DB_ENTRY_DELETE;
733 0 : attrs = NULL;
734 0 : stats_.route_stats[table->family()].deleted++;
735 0 : break;
736 : }
737 :
738 : // If path is already marked as llgr_stale, then there is no
739 : // need to process again. This can happen if the session flips
740 : // while in LLGR_TIMER state.
741 3232 : if (path->IsLlgrStale())
742 0 : return false;
743 :
744 3233 : attrs = path->GetAttr();
745 3235 : stale = BgpPath::LlgrStale;
746 3235 : oper = DBRequest::DB_ENTRY_ADD_CHANGE;
747 3235 : stats_.route_stats[table->family()].llgr_staled++;
748 3236 : break;
749 : }
750 :
751 : // Feed the route modify/delete request to the table input process.
752 283790 : return table->InputCommon(root, rt, path, peer_close_->peer(), NULL, oper,
753 94597 : attrs, path->GetPathId(), path->GetFlags() | stale, path->GetLabel(),
754 94596 : path->GetL3Label());
755 100776 : }
756 :
757 : //
758 : // Handler for an Event.
759 : //
760 143559 : bool PeerCloseManager::EventCallback(Event *event) {
761 143559 : CHECK_CONCURRENCY(peer_close_->GetTaskName());
762 : bool result;
763 :
764 143559 : switch (event->event_type) {
765 0 : case EVENT_NONE:
766 0 : break;
767 20925 : case CLOSE:
768 20925 : Close(event);
769 20925 : break;
770 14834 : case EOR_RECEIVED:
771 14834 : ProcessEORMarkerReceived(event);
772 14834 : break;
773 20217 : case MEMBERSHIP_REQUEST:
774 20217 : MembershipRequest(event);
775 20217 : break;
776 84733 : case MEMBERSHIP_REQUEST_COMPLETE_CALLBACK:
777 84733 : result = MembershipRequestCallback(event);
778 :
779 : // Notify clients if we are no longer using the membership mgr.
780 84733 : if (result)
781 11196 : peer_close_->MembershipRequestCallbackComplete();
782 84733 : break;
783 2850 : case TIMER_CALLBACK:
784 2850 : RestartTimerCallback(event);
785 2850 : break;
786 : }
787 :
788 143559 : delete event;
789 143559 : return true;
790 : }
|