blob: 44fbea038c32bc2110aa892a615a40b261032d4c [file] [log] [blame]
/*
 * Copyright 2015 Open Networking Laboratory
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16package org.onosproject.store.mastership.impl;
17
18import static org.onlab.util.Tools.groupedThreads;
Ayaka Koshibe941f8602015-04-15 14:17:08 -070019import static org.onlab.util.Tools.futureGetOrElse;
Madan Jampani0f6ad142015-05-13 17:10:04 -070020import static org.onosproject.mastership.MastershipEvent.Type.BACKUPS_CHANGED;
Madan Jampani84b6b402015-02-25 17:49:54 -080021import static org.onosproject.mastership.MastershipEvent.Type.MASTER_CHANGED;
22import static org.slf4j.LoggerFactory.getLogger;
23import static com.google.common.base.Preconditions.checkArgument;
24
Madan Jampani84b6b402015-02-25 17:49:54 -080025import java.util.List;
26import java.util.Map;
27import java.util.Set;
Madan Jampanif7536ab2015-05-07 23:23:23 -070028import java.util.concurrent.CompletableFuture;
Madan Jampani84b6b402015-02-25 17:49:54 -080029import java.util.concurrent.ExecutorService;
30import java.util.concurrent.Executors;
Madan Jampanif7536ab2015-05-07 23:23:23 -070031import java.util.concurrent.ScheduledExecutorService;
32import java.util.concurrent.TimeUnit;
Madan Jampani84b6b402015-02-25 17:49:54 -080033import java.util.regex.Matcher;
34import java.util.regex.Pattern;
35import java.util.stream.Collectors;
36
37import org.apache.felix.scr.annotations.Activate;
38import org.apache.felix.scr.annotations.Component;
39import org.apache.felix.scr.annotations.Deactivate;
40import org.apache.felix.scr.annotations.Reference;
41import org.apache.felix.scr.annotations.ReferenceCardinality;
42import org.apache.felix.scr.annotations.Service;
43import org.onlab.util.KryoNamespace;
44import org.onosproject.cluster.ClusterService;
45import org.onosproject.cluster.Leadership;
46import org.onosproject.cluster.LeadershipEvent;
47import org.onosproject.cluster.LeadershipEventListener;
48import org.onosproject.cluster.LeadershipService;
49import org.onosproject.cluster.NodeId;
50import org.onosproject.cluster.RoleInfo;
51import org.onosproject.mastership.MastershipEvent;
52import org.onosproject.mastership.MastershipStore;
53import org.onosproject.mastership.MastershipStoreDelegate;
54import org.onosproject.mastership.MastershipTerm;
55import org.onosproject.net.DeviceId;
56import org.onosproject.net.MastershipRole;
57import org.onosproject.store.AbstractStore;
58import org.onosproject.store.cluster.messaging.ClusterCommunicationService;
Madan Jampani84b6b402015-02-25 17:49:54 -080059import org.onosproject.store.cluster.messaging.MessageSubject;
60import org.onosproject.store.serializers.KryoNamespaces;
61import org.onosproject.store.serializers.KryoSerializer;
62import org.onosproject.store.serializers.StoreSerializer;
63import org.slf4j.Logger;
64
65import com.google.common.base.Objects;
66import com.google.common.collect.Lists;
67import com.google.common.collect.Maps;
68import com.google.common.collect.Sets;
69
/**
 * Implementation of the MastershipStore on top of Leadership Service.
 */
Madan Jampani5756c352015-04-29 00:23:58 -070073@Component(immediate = true, enabled = true)
Madan Jampani84b6b402015-02-25 17:49:54 -080074@Service
75public class ConsistentDeviceMastershipStore
76 extends AbstractStore<MastershipEvent, MastershipStoreDelegate>
77 implements MastershipStore {
78
79 private final Logger log = getLogger(getClass());
80
81 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
82 protected LeadershipService leadershipService;
83
84 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
85 protected ClusterService clusterService;
86
87 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
88 protected ClusterCommunicationService clusterCommunicator;
89
90 private NodeId localNodeId;
91 private final Set<DeviceId> connectedDevices = Sets.newHashSet();
92
Madan Jampani84b6b402015-02-25 17:49:54 -080093 private static final MessageSubject ROLE_RELINQUISH_SUBJECT =
94 new MessageSubject("mastership-store-device-role-relinquish");
Madan Jampani9bd1f152015-04-30 23:33:35 -070095 private static final MessageSubject TRANSITION_FROM_MASTER_TO_STANDBY_SUBJECT =
Madan Jampani1af8e132015-04-30 16:41:18 -070096 new MessageSubject("mastership-store-device-mastership-relinquish");
Madan Jampani84b6b402015-02-25 17:49:54 -080097
98 private static final Pattern DEVICE_MASTERSHIP_TOPIC_PATTERN =
Madan Jampani5756c352015-04-29 00:23:58 -070099 Pattern.compile("device:(.*)");
Madan Jampani84b6b402015-02-25 17:49:54 -0800100
Madan Jampani84b6b402015-02-25 17:49:54 -0800101 private ExecutorService messageHandlingExecutor;
Madan Jampanif7536ab2015-05-07 23:23:23 -0700102 private ScheduledExecutorService transferExecutor;
Madan Jampani84b6b402015-02-25 17:49:54 -0800103 private final LeadershipEventListener leadershipEventListener =
104 new InternalDeviceMastershipEventListener();
105
106 private static final String NODE_ID_NULL = "Node ID cannot be null";
Madan Jampanif7536ab2015-05-07 23:23:23 -0700107 private static final String DEVICE_ID_NULL = "Device ID cannot be null";
108 private static final int WAIT_BEFORE_MASTERSHIP_HANDOFF_MILLIS = 3000;
Madan Jampani84b6b402015-02-25 17:49:54 -0800109
110 public static final StoreSerializer SERIALIZER = new KryoSerializer() {
111 @Override
112 protected void setupKryoPool() {
113 serializerPool = KryoNamespace.newBuilder()
114 .register(KryoNamespaces.API)
115 .register(MastershipRole.class)
116 .register(MastershipEvent.class)
Madan Jampani1af8e132015-04-30 16:41:18 -0700117 .register(MastershipEvent.Type.class)
Madan Jampani84b6b402015-02-25 17:49:54 -0800118 .build();
119 }
120 };
121
122 @Activate
123 public void activate() {
124 messageHandlingExecutor =
Madan Jampanif7536ab2015-05-07 23:23:23 -0700125 Executors.newSingleThreadExecutor(
126 groupedThreads("onos/store/device/mastership", "message-handler"));
127 transferExecutor =
128 Executors.newSingleThreadScheduledExecutor(
129 groupedThreads("onos/store/device/mastership", "mastership-transfer-executor"));
Madan Jampanibbed40422015-05-20 12:00:38 -0700130 clusterCommunicator.addSubscriber(ROLE_RELINQUISH_SUBJECT,
Madan Jampanid46e18f2015-05-04 23:19:33 -0700131 SERIALIZER::decode,
Madan Jampanif7536ab2015-05-07 23:23:23 -0700132 this::relinquishLocalRole,
Madan Jampanid46e18f2015-05-04 23:19:33 -0700133 SERIALIZER::encode,
134 messageHandlingExecutor);
Madan Jampani9bd1f152015-04-30 23:33:35 -0700135 clusterCommunicator.addSubscriber(TRANSITION_FROM_MASTER_TO_STANDBY_SUBJECT,
Madan Jampani1af8e132015-04-30 16:41:18 -0700136 SERIALIZER::decode,
Madan Jampani9bd1f152015-04-30 23:33:35 -0700137 this::transitionFromMasterToStandby,
Madan Jampani1af8e132015-04-30 16:41:18 -0700138 SERIALIZER::encode,
139 messageHandlingExecutor);
Madan Jampani84b6b402015-02-25 17:49:54 -0800140 localNodeId = clusterService.getLocalNode().id();
141 leadershipService.addListener(leadershipEventListener);
142
Madan Jampaniafeebbd2015-05-19 15:26:01 -0700143 log.info("Started");
Madan Jampani84b6b402015-02-25 17:49:54 -0800144 }
145
146 @Deactivate
147 public void deactivate() {
Madan Jampani84b6b402015-02-25 17:49:54 -0800148 clusterCommunicator.removeSubscriber(ROLE_RELINQUISH_SUBJECT);
Madan Jampani9bd1f152015-04-30 23:33:35 -0700149 clusterCommunicator.removeSubscriber(TRANSITION_FROM_MASTER_TO_STANDBY_SUBJECT);
Madan Jampani84b6b402015-02-25 17:49:54 -0800150 messageHandlingExecutor.shutdown();
Madan Jampanif7536ab2015-05-07 23:23:23 -0700151 transferExecutor.shutdown();
Madan Jampani84b6b402015-02-25 17:49:54 -0800152 leadershipService.removeListener(leadershipEventListener);
153
Madan Jampaniafeebbd2015-05-19 15:26:01 -0700154 log.info("Stopped");
Madan Jampani84b6b402015-02-25 17:49:54 -0800155 }
156
157 @Override
Madan Jampanide003d92015-05-11 17:14:20 -0700158 public CompletableFuture<MastershipRole> requestRole(DeviceId deviceId) {
Madan Jampani84b6b402015-02-25 17:49:54 -0800159 checkArgument(deviceId != null, DEVICE_ID_NULL);
160
161 String leadershipTopic = createDeviceMastershipTopic(deviceId);
HIGUCHI Yuta1979f552015-12-28 21:24:26 -0800162 connectedDevices.add(deviceId);
163 return leadershipService.runForLeadership(leadershipTopic)
164 .thenApply(leadership -> {
165 return Objects.equal(localNodeId, leadership.leader())
166 ? MastershipRole.MASTER : MastershipRole.STANDBY;
167 });
Madan Jampani84b6b402015-02-25 17:49:54 -0800168 }
169
170 @Override
171 public MastershipRole getRole(NodeId nodeId, DeviceId deviceId) {
172 checkArgument(nodeId != null, NODE_ID_NULL);
173 checkArgument(deviceId != null, DEVICE_ID_NULL);
174
175 String leadershipTopic = createDeviceMastershipTopic(deviceId);
Madan Jampani207528f2015-06-04 13:25:10 -0700176 NodeId leader = leadershipService.getLeader(leadershipTopic);
Madan Jampani0be32ac2015-06-04 15:18:43 -0700177 if (Objects.equal(nodeId, leader)) {
Madan Jampani84b6b402015-02-25 17:49:54 -0800178 return MastershipRole.MASTER;
179 }
Madan Jampani1b02f822015-05-19 11:01:49 -0700180 return leadershipService.getCandidates(leadershipTopic).contains(nodeId) ?
181 MastershipRole.STANDBY : MastershipRole.NONE;
Madan Jampani84b6b402015-02-25 17:49:54 -0800182 }
183
184 @Override
185 public NodeId getMaster(DeviceId deviceId) {
186 checkArgument(deviceId != null, DEVICE_ID_NULL);
187
188 String leadershipTopic = createDeviceMastershipTopic(deviceId);
Madan Jampani207528f2015-06-04 13:25:10 -0700189 return leadershipService.getLeader(leadershipTopic);
Madan Jampani84b6b402015-02-25 17:49:54 -0800190 }
191
192 @Override
193 public RoleInfo getNodes(DeviceId deviceId) {
194 checkArgument(deviceId != null, DEVICE_ID_NULL);
195
196 Map<NodeId, MastershipRole> roles = Maps.newHashMap();
197 clusterService
198 .getNodes()
Madan Jampani84b6b402015-02-25 17:49:54 -0800199 .forEach((node) -> roles.put(node.id(), getRole(node.id(), deviceId)));
200
201 NodeId master = null;
202 final List<NodeId> standbys = Lists.newLinkedList();
203
Madan Jampani86940d92015-05-06 11:47:57 -0700204 List<NodeId> candidates = leadershipService.getCandidates(createDeviceMastershipTopic(deviceId));
205
Madan Jampani84b6b402015-02-25 17:49:54 -0800206 for (Map.Entry<NodeId, MastershipRole> entry : roles.entrySet()) {
207 if (entry.getValue() == MastershipRole.MASTER) {
208 master = entry.getKey();
209 } else if (entry.getValue() == MastershipRole.STANDBY) {
210 standbys.add(entry.getKey());
211 }
212 }
213
Madan Jampani86940d92015-05-06 11:47:57 -0700214 List<NodeId> sortedStandbyList = candidates.stream().filter(standbys::contains).collect(Collectors.toList());
215
216 return new RoleInfo(master, sortedStandbyList);
Madan Jampani84b6b402015-02-25 17:49:54 -0800217 }
218
219 @Override
220 public Set<DeviceId> getDevices(NodeId nodeId) {
221 checkArgument(nodeId != null, NODE_ID_NULL);
222
223 return leadershipService
224 .ownedTopics(nodeId)
225 .stream()
226 .filter(this::isDeviceMastershipTopic)
227 .map(this::extractDeviceIdFromTopic)
228 .collect(Collectors.toSet());
229 }
230
231 @Override
Madan Jampanif7536ab2015-05-07 23:23:23 -0700232 public CompletableFuture<MastershipEvent> setMaster(NodeId nodeId, DeviceId deviceId) {
Madan Jampani84b6b402015-02-25 17:49:54 -0800233 checkArgument(nodeId != null, NODE_ID_NULL);
234 checkArgument(deviceId != null, DEVICE_ID_NULL);
235
Madan Jampani1af8e132015-04-30 16:41:18 -0700236 NodeId currentMaster = getMaster(deviceId);
237 if (nodeId.equals(currentMaster)) {
Madan Jampanif7536ab2015-05-07 23:23:23 -0700238 return CompletableFuture.completedFuture(null);
Madan Jampani1af8e132015-04-30 16:41:18 -0700239 } else {
240 String leadershipTopic = createDeviceMastershipTopic(deviceId);
241 List<NodeId> candidates = leadershipService.getCandidates(leadershipTopic);
242 if (candidates.isEmpty()) {
Madan Jampanif7536ab2015-05-07 23:23:23 -0700243 return CompletableFuture.completedFuture(null);
Madan Jampani1af8e132015-04-30 16:41:18 -0700244 }
245 if (leadershipService.makeTopCandidate(leadershipTopic, nodeId)) {
Madan Jampanif7536ab2015-05-07 23:23:23 -0700246 CompletableFuture<MastershipEvent> result = new CompletableFuture<>();
247 // There is brief wait before we step down from mastership.
248 // This is to ensure any work that happens when standby preference
249 // order changes can complete. For example: flow entries need to be backed
250 // to the new top standby (ONOS-1883)
251 // FIXME: This potentially introduces a race-condition.
252 // Right now role changes are only forced via CLI.
253 transferExecutor.schedule(() -> {
254 result.complete(transitionFromMasterToStandby(deviceId));
255 }, WAIT_BEFORE_MASTERSHIP_HANDOFF_MILLIS, TimeUnit.MILLISECONDS);
256 return result;
Madan Jampani1af8e132015-04-30 16:41:18 -0700257 } else {
258 log.warn("Failed to promote {} to mastership for {}", nodeId, deviceId);
259 }
260 }
Madan Jampanif7536ab2015-05-07 23:23:23 -0700261 return CompletableFuture.completedFuture(null);
Madan Jampani84b6b402015-02-25 17:49:54 -0800262 }
263
264 @Override
265 public MastershipTerm getTermFor(DeviceId deviceId) {
266 checkArgument(deviceId != null, DEVICE_ID_NULL);
267
268 String leadershipTopic = createDeviceMastershipTopic(deviceId);
269 Leadership leadership = leadershipService.getLeadership(leadershipTopic);
270 return leadership != null ? MastershipTerm.of(leadership.leader(), leadership.epoch()) : null;
271 }
272
273 @Override
Madan Jampanif7536ab2015-05-07 23:23:23 -0700274 public CompletableFuture<MastershipEvent> setStandby(NodeId nodeId, DeviceId deviceId) {
Madan Jampani84b6b402015-02-25 17:49:54 -0800275 checkArgument(nodeId != null, NODE_ID_NULL);
276 checkArgument(deviceId != null, DEVICE_ID_NULL);
277
Madan Jampani1af8e132015-04-30 16:41:18 -0700278 NodeId currentMaster = getMaster(deviceId);
279 if (!nodeId.equals(currentMaster)) {
Madan Jampanif7536ab2015-05-07 23:23:23 -0700280 return CompletableFuture.completedFuture(null);
Madan Jampani1af8e132015-04-30 16:41:18 -0700281 }
Madan Jampanid46e18f2015-05-04 23:19:33 -0700282
283 String leadershipTopic = createDeviceMastershipTopic(deviceId);
284 List<NodeId> candidates = leadershipService.getCandidates(leadershipTopic);
285
286 NodeId newMaster = candidates.stream()
287 .filter(candidate -> !Objects.equal(nodeId, candidate))
288 .findFirst()
289 .orElse(null);
290 log.info("Transitioning to role {} for {}. Next master: {}",
291 newMaster != null ? MastershipRole.STANDBY : MastershipRole.NONE, deviceId, newMaster);
292
293 if (newMaster != null) {
294 return setMaster(newMaster, deviceId);
295 }
296 return relinquishRole(nodeId, deviceId);
Madan Jampani84b6b402015-02-25 17:49:54 -0800297 }
298
299 @Override
Madan Jampanif7536ab2015-05-07 23:23:23 -0700300 public CompletableFuture<MastershipEvent> relinquishRole(NodeId nodeId, DeviceId deviceId) {
Madan Jampani84b6b402015-02-25 17:49:54 -0800301 checkArgument(nodeId != null, NODE_ID_NULL);
302 checkArgument(deviceId != null, DEVICE_ID_NULL);
303
Madan Jampanibbed40422015-05-20 12:00:38 -0700304 if (nodeId.equals(localNodeId)) {
305 return relinquishLocalRole(deviceId);
Madan Jampani84b6b402015-02-25 17:49:54 -0800306 }
Madan Jampanibbed40422015-05-20 12:00:38 -0700307
308 log.debug("Forwarding request to relinquish "
309 + "role for device {} to {}", deviceId, nodeId);
310 return clusterCommunicator.sendAndReceive(
311 deviceId,
312 ROLE_RELINQUISH_SUBJECT,
313 SERIALIZER::encode,
314 SERIALIZER::decode,
315 nodeId);
Madan Jampanif7536ab2015-05-07 23:23:23 -0700316 }
317
Madan Jampanibbed40422015-05-20 12:00:38 -0700318 private CompletableFuture<MastershipEvent> relinquishLocalRole(DeviceId deviceId) {
Madan Jampanif7536ab2015-05-07 23:23:23 -0700319 checkArgument(deviceId != null, DEVICE_ID_NULL);
Madan Jampani84b6b402015-02-25 17:49:54 -0800320
321 // Check if this node is can be managed by this node.
322 if (!connectedDevices.contains(deviceId)) {
Madan Jampanibbed40422015-05-20 12:00:38 -0700323 return CompletableFuture.completedFuture(null);
Madan Jampani84b6b402015-02-25 17:49:54 -0800324 }
325
326 String leadershipTopic = createDeviceMastershipTopic(deviceId);
Madan Jampani9bd1f152015-04-30 23:33:35 -0700327 NodeId currentLeader = leadershipService.getLeader(leadershipTopic);
Madan Jampani84b6b402015-02-25 17:49:54 -0800328
Madan Jampani9bd1f152015-04-30 23:33:35 -0700329 MastershipEvent.Type eventType = Objects.equal(currentLeader, localNodeId)
330 ? MastershipEvent.Type.MASTER_CHANGED
331 : MastershipEvent.Type.BACKUPS_CHANGED;
Madan Jampani84b6b402015-02-25 17:49:54 -0800332
333 connectedDevices.remove(deviceId);
Madan Jampanibbed40422015-05-20 12:00:38 -0700334 return leadershipService.withdraw(leadershipTopic)
335 .thenApply(v -> new MastershipEvent(eventType, deviceId, getNodes(deviceId)));
Madan Jampani84b6b402015-02-25 17:49:54 -0800336 }
337
Madan Jampani9bd1f152015-04-30 23:33:35 -0700338 private MastershipEvent transitionFromMasterToStandby(DeviceId deviceId) {
Madan Jampani1af8e132015-04-30 16:41:18 -0700339 checkArgument(deviceId != null, DEVICE_ID_NULL);
340
341 NodeId currentMaster = getMaster(deviceId);
342 if (currentMaster == null) {
343 return null;
344 }
345
346 if (!currentMaster.equals(localNodeId)) {
347 log.info("Forwarding request to relinquish "
348 + "mastership for device {} to {}", deviceId, currentMaster);
349 return futureGetOrElse(clusterCommunicator.sendAndReceive(
350 deviceId,
Madan Jampani9bd1f152015-04-30 23:33:35 -0700351 TRANSITION_FROM_MASTER_TO_STANDBY_SUBJECT,
Madan Jampani1af8e132015-04-30 16:41:18 -0700352 SERIALIZER::encode,
353 SERIALIZER::decode,
354 currentMaster), null);
355 }
356
Madan Jampani9bd1f152015-04-30 23:33:35 -0700357 return leadershipService.stepdown(createDeviceMastershipTopic(deviceId))
358 ? new MastershipEvent(MastershipEvent.Type.MASTER_CHANGED, deviceId, getNodes(deviceId)) : null;
Madan Jampani1af8e132015-04-30 16:41:18 -0700359 }
360
Madan Jampani84b6b402015-02-25 17:49:54 -0800361 @Override
362 public void relinquishAllRole(NodeId nodeId) {
363 // Noop. LeadershipService already takes care of detecting and purging deadlocks.
364 }
365
Madan Jampani84b6b402015-02-25 17:49:54 -0800366 private class InternalDeviceMastershipEventListener implements LeadershipEventListener {
367 @Override
368 public void event(LeadershipEvent event) {
369 Leadership leadership = event.subject();
370 if (!isDeviceMastershipTopic(leadership.topic())) {
371 return;
372 }
Madan Jampani84b6b402015-02-25 17:49:54 -0800373 DeviceId deviceId = extractDeviceIdFromTopic(leadership.topic());
Thomas Vachuska4b839c72015-05-18 15:43:03 -0700374 switch (event.type()) {
375 case LEADER_ELECTED:
376 notifyDelegate(new MastershipEvent(MASTER_CHANGED, deviceId, getNodes(deviceId)));
377 break;
378 case LEADER_REELECTED:
379 // There is no concept of leader re-election in the new distributed leadership manager.
380 throw new IllegalStateException("Unexpected event type");
381 case LEADER_BOOTED:
382 notifyDelegate(new MastershipEvent(MASTER_CHANGED, deviceId, getNodes(deviceId)));
383 break;
384 case CANDIDATES_CHANGED:
385 notifyDelegate(new MastershipEvent(BACKUPS_CHANGED, deviceId, getNodes(deviceId)));
386 break;
387 default:
388 return;
Madan Jampani84b6b402015-02-25 17:49:54 -0800389 }
390 }
391 }
392
393 private String createDeviceMastershipTopic(DeviceId deviceId) {
Madan Jampani5756c352015-04-29 00:23:58 -0700394 return String.format("device:%s", deviceId.toString());
Madan Jampani84b6b402015-02-25 17:49:54 -0800395 }
396
397 private DeviceId extractDeviceIdFromTopic(String topic) {
398 Matcher m = DEVICE_MASTERSHIP_TOPIC_PATTERN.matcher(topic);
399 if (m.matches()) {
400 return DeviceId.deviceId(m.group(1));
401 } else {
402 throw new IllegalArgumentException("Invalid device mastership topic: " + topic);
403 }
404 }
405
406 private boolean isDeviceMastershipTopic(String topic) {
407 Matcher m = DEVICE_MASTERSHIP_TOPIC_PATTERN.matcher(topic);
408 return m.matches();
409 }
410
Madan Jampanic26eede2015-04-16 11:42:16 -0700411}