59ce05edca3198cfe39b067dbe202e36cc4ac796
[netconf.git] / netconf / sal-netconf-connector / src / main / java / org / opendaylight / netconf / sal / connect / netconf / sal / KeepaliveSalFacade.java
1 /*
2  * Copyright (c) 2015 Cisco Systems, Inc. and others.  All rights reserved.
3  *
4  * This program and the accompanying materials are made available under the
5  * terms of the Eclipse Public License v1.0 which accompanies this distribution,
6  * and is available at http://www.eclipse.org/legal/epl-v10.html
7  */
8 package org.opendaylight.netconf.sal.connect.netconf.sal;
9
10 import static org.opendaylight.netconf.sal.connect.netconf.util.NetconfBaseOps.getSourceNode;
11 import static org.opendaylight.netconf.sal.connect.netconf.util.NetconfMessageTransformUtil.NETCONF_GET_CONFIG_NODEID;
12 import static org.opendaylight.netconf.sal.connect.netconf.util.NetconfMessageTransformUtil.NETCONF_GET_CONFIG_PATH;
13 import static org.opendaylight.netconf.sal.connect.netconf.util.NetconfMessageTransformUtil.NETCONF_RUNNING_QNAME;
14
15 import com.google.common.base.Preconditions;
16 import com.google.common.util.concurrent.FluentFuture;
17 import com.google.common.util.concurrent.FutureCallback;
18 import com.google.common.util.concurrent.Futures;
19 import com.google.common.util.concurrent.MoreExecutors;
20 import edu.umd.cs.findbugs.annotations.SuppressFBWarnings;
21 import java.util.concurrent.ScheduledExecutorService;
22 import java.util.concurrent.ScheduledFuture;
23 import java.util.concurrent.TimeUnit;
24 import java.util.concurrent.atomic.AtomicBoolean;
25 import javax.annotation.Nonnull;
26 import javax.annotation.Nullable;
27 import org.eclipse.jdt.annotation.NonNull;
28 import org.opendaylight.mdsal.dom.api.DOMActionService;
29 import org.opendaylight.mdsal.dom.api.DOMNotification;
30 import org.opendaylight.mdsal.dom.api.DOMRpcAvailabilityListener;
31 import org.opendaylight.mdsal.dom.api.DOMRpcResult;
32 import org.opendaylight.mdsal.dom.api.DOMRpcService;
33 import org.opendaylight.netconf.sal.connect.api.RemoteDeviceHandler;
34 import org.opendaylight.netconf.sal.connect.netconf.listener.NetconfDeviceCommunicator;
35 import org.opendaylight.netconf.sal.connect.netconf.listener.NetconfSessionPreferences;
36 import org.opendaylight.netconf.sal.connect.netconf.util.NetconfMessageTransformUtil;
37 import org.opendaylight.netconf.sal.connect.util.RemoteDeviceId;
38 import org.opendaylight.yangtools.concepts.ListenerRegistration;
39 import org.opendaylight.yangtools.yang.data.api.schema.ContainerNode;
40 import org.opendaylight.yangtools.yang.data.api.schema.NormalizedNode;
41 import org.opendaylight.yangtools.yang.model.api.SchemaContext;
42 import org.opendaylight.yangtools.yang.model.api.SchemaPath;
43 import org.slf4j.Logger;
44 import org.slf4j.LoggerFactory;
45
46 /**
47  * SalFacade proxy that invokes keepalive RPCs to prevent session shutdown from remote device
48  * and to detect incorrect session drops (netconf session is inactive, but TCP/SSH connection is still present).
49  * The keepalive RPC is a get-config with empty filter.
50  */
51 public final class KeepaliveSalFacade implements RemoteDeviceHandler<NetconfSessionPreferences> {
52
53     private static final Logger LOG = LoggerFactory.getLogger(KeepaliveSalFacade.class);
54
55     // 2 minutes keepalive delay by default
56     private static final long DEFAULT_DELAY = TimeUnit.MINUTES.toSeconds(2);
57
58     // 1 minute transaction timeout by default
59     private static final long DEFAULT_TRANSACTION_TIMEOUT_MILLI = TimeUnit.MILLISECONDS.toMillis(60000);
60
61     private final RemoteDeviceId id;
62     private final RemoteDeviceHandler<NetconfSessionPreferences> salFacade;
63     private final ScheduledExecutorService executor;
64     private final long keepaliveDelaySeconds;
65     private final ResetKeepalive resetKeepaliveTask;
66     private final long defaultRequestTimeoutMillis;
67
68     private volatile NetconfDeviceCommunicator listener;
69     private volatile ScheduledFuture<?> currentKeepalive;
70     private volatile DOMRpcService currentDeviceRpc;
71     private final AtomicBoolean lastKeepAliveSucceeded = new AtomicBoolean(false);
72
73     public KeepaliveSalFacade(final RemoteDeviceId id, final RemoteDeviceHandler<NetconfSessionPreferences> salFacade,
74                               final ScheduledExecutorService executor, final long keepaliveDelaySeconds,
75                               final long defaultRequestTimeoutMillis) {
76         this.id = id;
77         this.salFacade = salFacade;
78         this.executor = executor;
79         this.keepaliveDelaySeconds = keepaliveDelaySeconds;
80         this.defaultRequestTimeoutMillis = defaultRequestTimeoutMillis;
81         this.resetKeepaliveTask = new ResetKeepalive();
82     }
83
84     public KeepaliveSalFacade(final RemoteDeviceId id, final RemoteDeviceHandler<NetconfSessionPreferences> salFacade,
85                               final ScheduledExecutorService executor) {
86         this(id, salFacade, executor, DEFAULT_DELAY, DEFAULT_TRANSACTION_TIMEOUT_MILLI);
87     }
88
89     /**
90      * Set the netconf session listener whenever ready.
91      *
92      * @param listener netconf session listener
93      */
94     public void setListener(final NetconfDeviceCommunicator listener) {
95         this.listener = listener;
96     }
97
98     /**
99      * Just cancel current keepalive task.
100      * If its already started, let it finish ... not such a big deal.
101      *
102      * <p>
103      * Then schedule next keepalive.
104      */
105     void resetKeepalive() {
106         LOG.trace("{}: Resetting netconf keepalive timer", id);
107         if (currentKeepalive != null) {
108             currentKeepalive.cancel(false);
109         }
110         scheduleKeepalives();
111     }
112
113     /**
114      * Cancel current keepalive and also reset current deviceRpc.
115      */
116     private void stopKeepalives() {
117         if (currentKeepalive != null) {
118             currentKeepalive.cancel(false);
119         }
120         currentDeviceRpc = null;
121     }
122
123     void reconnect() {
124         Preconditions.checkState(listener != null, "%s: Unable to reconnect, session listener is missing", id);
125         stopKeepalives();
126         LOG.info("{}: Reconnecting inactive netconf session", id);
127         listener.disconnect();
128     }
129
130     @Override
131     public void onDeviceConnected(final SchemaContext remoteSchemaContext,
132                           final NetconfSessionPreferences netconfSessionPreferences, final DOMRpcService deviceRpc) {
133         onDeviceConnected(remoteSchemaContext, netconfSessionPreferences, deviceRpc, null);
134     }
135
136     @Override
137     public void onDeviceConnected(final SchemaContext remoteSchemaContext,
138             final NetconfSessionPreferences netconfSessionPreferences, final DOMRpcService deviceRpc,
139             final DOMActionService deviceAction) {
140         this.currentDeviceRpc = deviceRpc;
141         final DOMRpcService deviceRpc1 =
142                 new KeepaliveDOMRpcService(deviceRpc, resetKeepaliveTask, defaultRequestTimeoutMillis, executor);
143
144         salFacade.onDeviceConnected(remoteSchemaContext, netconfSessionPreferences, deviceRpc1, deviceAction);
145
146         LOG.debug("{}: Netconf session initiated, starting keepalives", id);
147         scheduleKeepalives();
148     }
149
150     private void scheduleKeepalives() {
151         lastKeepAliveSucceeded.set(true);
152         Preconditions.checkState(currentDeviceRpc != null);
153         LOG.trace("{}: Scheduling keepalives every  {} {}", id, keepaliveDelaySeconds, TimeUnit.SECONDS);
154         currentKeepalive = executor.scheduleWithFixedDelay(new Keepalive(),
155           keepaliveDelaySeconds, keepaliveDelaySeconds, TimeUnit.SECONDS);
156     }
157
158     @Override
159     public void onDeviceDisconnected() {
160         stopKeepalives();
161         salFacade.onDeviceDisconnected();
162     }
163
164     @Override
165     public void onDeviceFailed(final Throwable throwable) {
166         stopKeepalives();
167         salFacade.onDeviceFailed(throwable);
168     }
169
170     @Override
171     public void onNotification(final DOMNotification domNotification) {
172         resetKeepalive();
173         salFacade.onNotification(domNotification);
174     }
175
176     @Override
177     public void close() {
178         stopKeepalives();
179         salFacade.close();
180     }
181
182     // Keepalive RPC static resources
183     private static final ContainerNode KEEPALIVE_PAYLOAD = NetconfMessageTransformUtil.wrap(NETCONF_GET_CONFIG_NODEID,
184             getSourceNode(NETCONF_RUNNING_QNAME), NetconfMessageTransformUtil.EMPTY_FILTER);
185
186     /**
187      * Invoke keepalive RPC and check the response. In case of any received response the keepalive
188      * is considered successful and schedules next keepalive with a fixed delay. If the response is unsuccessful (no
189      * response received, or the rcp could not even be sent) immediate reconnect is triggered as netconf session
190      * is considered inactive/failed.
191      */
192     private class Keepalive implements Runnable, FutureCallback<DOMRpcResult> {
193
194         @Override
195         public void run() {
196             LOG.trace("{}: Invoking keepalive RPC", id);
197
198             try {
199                 boolean lastJobSucceeded = lastKeepAliveSucceeded.getAndSet(false);
200                 if (!lastJobSucceeded) {
201                     onFailure(new IllegalStateException("Previous keepalive timed out"));
202                 } else {
203                     Futures.addCallback(currentDeviceRpc.invokeRpc(NETCONF_GET_CONFIG_PATH, KEEPALIVE_PAYLOAD), this,
204                                         MoreExecutors.directExecutor());
205                 }
206             } catch (NullPointerException e) {
207                 LOG.debug("{}: Skipping keepalive while reconnecting", id);
208                 // Empty catch block intentional
209                 // Do nothing. The currentDeviceRpc was null and it means we hit the reconnect window and
210                 // attempted to send keepalive while we were reconnecting. Next keepalive will be scheduled
211                 // after reconnect so no action necessary here.
212             }
213         }
214
215         @SuppressFBWarnings(value = "RCN_REDUNDANT_NULLCHECK_OF_NONNULL_VALUE",
216                 justification = "Unrecognised NullableDecl")
217         @Override
218         public void onSuccess(final DOMRpcResult result) {
219             // No matter what response we got, rpc-reply or rpc-error,
220             // we got it from device so the netconf session is OK
221             if (result != null && result.getResult() != null) {
222                 lastKeepAliveSucceeded.set(true);
223             }  else if (result != null && result.getErrors() != null) {
224                 LOG.warn("{}: Keepalive RPC failed with error: {}", id, result.getErrors());
225                 lastKeepAliveSucceeded.set(true);
226             } else {
227                 LOG.warn("{} Keepalive RPC returned null with response. Reconnecting netconf session", id);
228                 reconnect();
229             }
230         }
231
232         @Override
233         public void onFailure(@Nonnull final Throwable throwable) {
234             LOG.warn("{}: Keepalive RPC failed. Reconnecting netconf session.", id, throwable);
235             reconnect();
236         }
237     }
238
239     /**
240      * Reset keepalive after each RPC response received.
241      */
242     private class ResetKeepalive implements FutureCallback<DOMRpcResult> {
243         @Override
244         public void onSuccess(@Nullable final DOMRpcResult result) {
245             // No matter what response we got,
246             // rpc-reply or rpc-error, we got it from device so the netconf session is OK.
247             resetKeepalive();
248         }
249
250         @Override
251         public void onFailure(@Nonnull final Throwable throwable) {
252             // User/Application RPC failed (The RPC did not reach the remote device or ..
253             // TODO what other reasons could cause this ?)
254             // There is no point in keeping this session. Reconnect.
255             LOG.warn("{}: Rpc failure detected. Reconnecting netconf session", id, throwable);
256             reconnect();
257         }
258     }
259
260     /*
261      * Request timeout task is called once the defaultRequestTimeoutMillis is
262      * reached. At this moment, if the request is not yet finished, we cancel
263      * it.
264      */
265     private static final class RequestTimeoutTask implements Runnable {
266
267         private final FluentFuture<DOMRpcResult> rpcResultFuture;
268
269         RequestTimeoutTask(final FluentFuture<DOMRpcResult> rpcResultFuture) {
270             this.rpcResultFuture = rpcResultFuture;
271         }
272
273         @Override
274         public void run() {
275             if (!rpcResultFuture.isDone()) {
276                 rpcResultFuture.cancel(true);
277             }
278         }
279     }
280
281     /**
282      * DOMRpcService proxy that attaches reset-keepalive-task and schedule
283      * request-timeout-task to each RPC invocation.
284      */
285     public static final class KeepaliveDOMRpcService implements DOMRpcService {
286
287         private final DOMRpcService deviceRpc;
288         private final ResetKeepalive resetKeepaliveTask;
289         private final long defaultRequestTimeoutMillis;
290         private final ScheduledExecutorService executor;
291
292         KeepaliveDOMRpcService(final DOMRpcService deviceRpc, final ResetKeepalive resetKeepaliveTask,
293                 final long defaultRequestTimeoutMillis, final ScheduledExecutorService executor) {
294             this.deviceRpc = deviceRpc;
295             this.resetKeepaliveTask = resetKeepaliveTask;
296             this.defaultRequestTimeoutMillis = defaultRequestTimeoutMillis;
297             this.executor = executor;
298         }
299
300         public DOMRpcService getDeviceRpc() {
301             return deviceRpc;
302         }
303
304         @Nonnull
305         @Override
306         public @NonNull FluentFuture<DOMRpcResult> invokeRpc(@Nonnull final SchemaPath type,
307                                                                       final NormalizedNode<?, ?> input) {
308             final FluentFuture<DOMRpcResult> rpcResultFuture = deviceRpc.invokeRpc(type, input);
309             Futures.addCallback(rpcResultFuture, resetKeepaliveTask, MoreExecutors.directExecutor());
310
311             final RequestTimeoutTask timeoutTask = new RequestTimeoutTask(rpcResultFuture);
312             executor.schedule(timeoutTask, defaultRequestTimeoutMillis, TimeUnit.MILLISECONDS);
313
314             return rpcResultFuture;
315         }
316
317         @Override
318         public <T extends DOMRpcAvailabilityListener> ListenerRegistration<T> registerRpcListener(
319                 @Nonnull final T listener) {
320             // There is no real communication with the device (yet), no reset here
321             return deviceRpc.registerRpcListener(listener);
322         }
323     }
324 }