blob: 0ef66f435563bcba7ad76f3a42376e4793961a7c [file] [log] [blame]
/*
 * Copyright 2014-2015 Open Networking Laboratory
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
Brian O'Connorabafb502014-12-02 22:26:20 -080016package org.onosproject.cluster.impl;
Ayaka Koshibe16609692014-09-23 12:46:15 -070017
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -080018import com.codahale.metrics.Timer;
19import com.codahale.metrics.Timer.Context;
Madan Jampanide003d92015-05-11 17:14:20 -070020import com.google.common.collect.Lists;
21import com.google.common.util.concurrent.Futures;
Ayaka Koshibe16609692014-09-23 12:46:15 -070022import org.apache.felix.scr.annotations.Activate;
tom4a5d1712014-09-23 17:49:39 -070023import org.apache.felix.scr.annotations.Component;
Ayaka Koshibe16609692014-09-23 12:46:15 -070024import org.apache.felix.scr.annotations.Deactivate;
25import org.apache.felix.scr.annotations.Reference;
26import org.apache.felix.scr.annotations.ReferenceCardinality;
tom4a5d1712014-09-23 17:49:39 -070027import org.apache.felix.scr.annotations.Service;
Yuta HIGUCHI6a462832014-11-23 23:56:03 -080028import org.onlab.metrics.MetricsService;
Brian O'Connorabafb502014-12-02 22:26:20 -080029import org.onosproject.cluster.ClusterService;
30import org.onosproject.cluster.ControllerNode;
31import org.onosproject.cluster.NodeId;
32import org.onosproject.cluster.RoleInfo;
Thomas Vachuska42e8cce2015-07-29 19:25:18 -070033import org.onosproject.event.AbstractListenerManager;
Brian O'Connorabafb502014-12-02 22:26:20 -080034import org.onosproject.core.MetricsHelper;
Changhoon Yoon541ef712015-05-23 17:18:34 +090035import org.onosproject.core.Permission;
Brian O'Connorabafb502014-12-02 22:26:20 -080036import org.onosproject.mastership.MastershipAdminService;
37import org.onosproject.mastership.MastershipEvent;
38import org.onosproject.mastership.MastershipListener;
39import org.onosproject.mastership.MastershipService;
40import org.onosproject.mastership.MastershipStore;
41import org.onosproject.mastership.MastershipStoreDelegate;
42import org.onosproject.mastership.MastershipTerm;
43import org.onosproject.mastership.MastershipTermService;
44import org.onosproject.net.DeviceId;
45import org.onosproject.net.MastershipRole;
Ayaka Koshibe16609692014-09-23 12:46:15 -070046import org.slf4j.Logger;
47
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -080048import java.util.Collection;
Thomas Vachuska12dfdc32014-11-29 16:03:12 -080049import java.util.HashMap;
50import java.util.HashSet;
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -080051import java.util.Iterator;
52import java.util.List;
Thomas Vachuska12dfdc32014-11-29 16:03:12 -080053import java.util.Map;
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -080054import java.util.Set;
Madan Jampanif7536ab2015-05-07 23:23:23 -070055import java.util.concurrent.CompletableFuture;
56
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -080057import static com.google.common.base.Preconditions.checkNotNull;
58import static com.google.common.collect.Lists.newArrayList;
59import static org.onlab.metrics.MetricsUtil.startTimer;
60import static org.onlab.metrics.MetricsUtil.stopTimer;
Brian O'Connorabafb502014-12-02 22:26:20 -080061import static org.onosproject.cluster.ControllerNode.State.ACTIVE;
62import static org.onosproject.net.MastershipRole.MASTER;
Changhoon Yoon541ef712015-05-23 17:18:34 +090063import static org.onosproject.security.AppGuard.checkPermission;
Thomas Vachuska42e8cce2015-07-29 19:25:18 -070064import static org.slf4j.LoggerFactory.getLogger;
Changhoon Yoon541ef712015-05-23 17:18:34 +090065
Yuta HIGUCHI6a462832014-11-23 23:56:03 -080066
tom4a5d1712014-09-23 17:49:39 -070067@Component(immediate = true)
68@Service
Ayaka Koshibe3eed2b02014-09-23 13:28:05 -070069public class MastershipManager
Thomas Vachuska42e8cce2015-07-29 19:25:18 -070070 extends AbstractListenerManager<MastershipEvent, MastershipListener>
Yuta HIGUCHIa22f69f2014-11-24 22:25:17 -080071 implements MastershipService, MastershipAdminService, MastershipTermService,
72 MetricsHelper {
Ayaka Koshibe16609692014-09-23 12:46:15 -070073
74 private static final String NODE_ID_NULL = "Node ID cannot be null";
75 private static final String DEVICE_ID_NULL = "Device ID cannot be null";
76 private static final String ROLE_NULL = "Mastership role cannot be null";
77
78 private final Logger log = getLogger(getClass());
79
alshabib339a3d92014-09-26 17:54:32 -070080 private final MastershipStoreDelegate delegate = new InternalDelegate();
Ayaka Koshibe16609692014-09-23 12:46:15 -070081
82 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
83 protected MastershipStore store;
84
85 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
tom4a5d1712014-09-23 17:49:39 -070086 protected ClusterService clusterService;
Ayaka Koshibe16609692014-09-23 12:46:15 -070087
Yuta HIGUCHI6a462832014-11-23 23:56:03 -080088 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
89 protected MetricsService metricsService;
90
Madan Jampanic6e574f2015-05-29 13:41:52 -070091 private NodeId localNodeId;
Yuta HIGUCHI6a462832014-11-23 23:56:03 -080092 private Timer requestRoleTimer;
Ayaka Koshibe3de43ca2014-09-26 16:40:23 -070093
Ayaka Koshibe16609692014-09-23 12:46:15 -070094 @Activate
95 public void activate() {
Yuta HIGUCHI6a462832014-11-23 23:56:03 -080096 requestRoleTimer = createTimer("Mastership", "requestRole", "responseTime");
Madan Jampanic6e574f2015-05-29 13:41:52 -070097 localNodeId = clusterService.getLocalNode().id();
Ayaka Koshibe16609692014-09-23 12:46:15 -070098 eventDispatcher.addSink(MastershipEvent.class, listenerRegistry);
alshabib339a3d92014-09-26 17:54:32 -070099 store.setDelegate(delegate);
Ayaka Koshibe16609692014-09-23 12:46:15 -0700100 log.info("Started");
101 }
102
103 @Deactivate
104 public void deactivate() {
105 eventDispatcher.removeSink(MastershipEvent.class);
alshabib339a3d92014-09-26 17:54:32 -0700106 store.unsetDelegate(delegate);
Ayaka Koshibe16609692014-09-23 12:46:15 -0700107 log.info("Stopped");
108 }
109
Ayaka Koshibe16609692014-09-23 12:46:15 -0700110 @Override
Madan Jampanide003d92015-05-11 17:14:20 -0700111 public CompletableFuture<Void> setRole(NodeId nodeId, DeviceId deviceId, MastershipRole role) {
Ayaka Koshibe16609692014-09-23 12:46:15 -0700112 checkNotNull(nodeId, NODE_ID_NULL);
113 checkNotNull(deviceId, DEVICE_ID_NULL);
114 checkNotNull(role, ROLE_NULL);
Ayaka Koshibed9f693e2014-09-29 18:04:54 -0700115
Madan Jampanif7536ab2015-05-07 23:23:23 -0700116 CompletableFuture<MastershipEvent> eventFuture = null;
Ayaka Koshibee60d4522014-10-28 15:07:00 -0700117
118 switch (role) {
119 case MASTER:
Madan Jampanif7536ab2015-05-07 23:23:23 -0700120 eventFuture = store.setMaster(nodeId, deviceId);
Ayaka Koshibee60d4522014-10-28 15:07:00 -0700121 break;
122 case STANDBY:
Madan Jampanif7536ab2015-05-07 23:23:23 -0700123 eventFuture = store.setStandby(nodeId, deviceId);
Ayaka Koshibee60d4522014-10-28 15:07:00 -0700124 break;
125 case NONE:
Madan Jampanif7536ab2015-05-07 23:23:23 -0700126 eventFuture = store.relinquishRole(nodeId, deviceId);
Ayaka Koshibee60d4522014-10-28 15:07:00 -0700127 break;
128 default:
129 log.info("Unknown role; ignoring");
Madan Jampanide003d92015-05-11 17:14:20 -0700130 return CompletableFuture.completedFuture(null);
Ayaka Koshibe971a38a2014-09-30 11:56:23 -0700131 }
Ayaka Koshibed9f693e2014-09-29 18:04:54 -0700132
Madan Jampanic6e574f2015-05-29 13:41:52 -0700133 return eventFuture.thenAccept(this::post)
134 .thenApply(v -> null);
Ayaka Koshibe16609692014-09-23 12:46:15 -0700135 }
136
137 @Override
tomb41d1ac2014-09-24 01:51:24 -0700138 public MastershipRole getLocalRole(DeviceId deviceId) {
Changhoon Yoon541ef712015-05-23 17:18:34 +0900139 checkPermission(Permission.CLUSTER_READ);
140
tomb41d1ac2014-09-24 01:51:24 -0700141 checkNotNull(deviceId, DEVICE_ID_NULL);
142 return store.getRole(clusterService.getLocalNode().id(), deviceId);
143 }
144
145 @Override
Madan Jampanic6e574f2015-05-29 13:41:52 -0700146 public CompletableFuture<Void> relinquishMastership(DeviceId deviceId) {
Changhoon Yoon541ef712015-05-23 17:18:34 +0900147 checkPermission(Permission.CLUSTER_WRITE);
Madan Jampanic6e574f2015-05-29 13:41:52 -0700148 return store.relinquishRole(localNodeId, deviceId)
149 .thenAccept(this::post)
150 .thenApply(v -> null);
tomb41d1ac2014-09-24 01:51:24 -0700151 }
152
153 @Override
Madan Jampanide003d92015-05-11 17:14:20 -0700154 public CompletableFuture<MastershipRole> requestRoleFor(DeviceId deviceId) {
Changhoon Yoon541ef712015-05-23 17:18:34 +0900155 checkPermission(Permission.CLUSTER_WRITE);
156
tomb41d1ac2014-09-24 01:51:24 -0700157 checkNotNull(deviceId, DEVICE_ID_NULL);
Yuta HIGUCHI6a462832014-11-23 23:56:03 -0800158 final Context timer = startTimer(requestRoleTimer);
Madan Jampanide003d92015-05-11 17:14:20 -0700159 return store.requestRole(deviceId).whenComplete((result, error) -> stopTimer(timer));
160
tomb41d1ac2014-09-24 01:51:24 -0700161 }
162
163 @Override
Ayaka Koshibe16609692014-09-23 12:46:15 -0700164 public NodeId getMasterFor(DeviceId deviceId) {
Changhoon Yoon541ef712015-05-23 17:18:34 +0900165 checkPermission(Permission.CLUSTER_READ);
166
Ayaka Koshibe16609692014-09-23 12:46:15 -0700167 checkNotNull(deviceId, DEVICE_ID_NULL);
168 return store.getMaster(deviceId);
169 }
170
171 @Override
172 public Set<DeviceId> getDevicesOf(NodeId nodeId) {
Changhoon Yoon541ef712015-05-23 17:18:34 +0900173 checkPermission(Permission.CLUSTER_READ);
174
Ayaka Koshibe16609692014-09-23 12:46:15 -0700175 checkNotNull(nodeId, NODE_ID_NULL);
176 return store.getDevices(nodeId);
177 }
178
Ayaka Koshibe45503ce2014-10-14 11:26:45 -0700179 @Override
Ayaka Koshibeabedb092014-10-20 17:01:31 -0700180 public RoleInfo getNodesFor(DeviceId deviceId) {
Changhoon Yoon541ef712015-05-23 17:18:34 +0900181 checkPermission(Permission.CLUSTER_READ);
182
Ayaka Koshibe45503ce2014-10-14 11:26:45 -0700183 checkNotNull(deviceId, DEVICE_ID_NULL);
184 return store.getNodes(deviceId);
185 }
Ayaka Koshibeb70d34b2014-09-25 15:43:01 -0700186
187 @Override
Yuta HIGUCHIbcac4992014-11-22 19:27:57 -0800188 public MastershipTerm getMastershipTerm(DeviceId deviceId) {
189 return store.getTermFor(deviceId);
Ayaka Koshibeb70d34b2014-09-25 15:43:01 -0700190 }
191
Ayaka Koshibe16609692014-09-23 12:46:15 -0700192 @Override
Yuta HIGUCHIa22f69f2014-11-24 22:25:17 -0800193 public MetricsService metricsService() {
194 return metricsService;
195 }
Ayaka Koshibe16609692014-09-23 12:46:15 -0700196
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800197 @Override
198 public void balanceRoles() {
199 List<ControllerNode> nodes = newArrayList(clusterService.getNodes());
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800200 Map<ControllerNode, Set<DeviceId>> controllerDevices = new HashMap<>();
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800201 int deviceCount = 0;
202
203 // Create buckets reflecting current ownership.
204 for (ControllerNode node : nodes) {
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800205 if (clusterService.getState(node.id()) == ACTIVE) {
206 Set<DeviceId> devicesOf = new HashSet<>(getDevicesOf(node.id()));
207 deviceCount += devicesOf.size();
208 controllerDevices.put(node, devicesOf);
209 log.info("Node {} has {} devices.", node.id(), devicesOf.size());
210 }
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800211 }
212
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800213 // Now re-balance the buckets until they are roughly even.
Madan Jampanide003d92015-05-11 17:14:20 -0700214 List<CompletableFuture<Void>> balanceBucketsFutures = Lists.newLinkedList();
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800215 int rounds = controllerDevices.keySet().size();
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800216 for (int i = 0; i < rounds; i++) {
217 // Iterate over the buckets and find the smallest and the largest.
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800218 ControllerNode smallest = findBucket(true, controllerDevices);
219 ControllerNode largest = findBucket(false, controllerDevices);
Madan Jampanide003d92015-05-11 17:14:20 -0700220 balanceBucketsFutures.add(balanceBuckets(smallest, largest, controllerDevices, deviceCount));
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800221 }
Madan Jampanide003d92015-05-11 17:14:20 -0700222 CompletableFuture<Void> balanceRolesFuture = CompletableFuture.allOf(
223 balanceBucketsFutures.toArray(new CompletableFuture[balanceBucketsFutures.size()]));
224
225 Futures.getUnchecked(balanceRolesFuture);
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800226 }
227
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800228 private ControllerNode findBucket(boolean min,
229 Map<ControllerNode, Set<DeviceId>> controllerDevices) {
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800230 int xSize = min ? Integer.MAX_VALUE : -1;
231 ControllerNode xNode = null;
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800232 for (ControllerNode node : controllerDevices.keySet()) {
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800233 int size = controllerDevices.get(node).size();
234 if ((min && size < xSize) || (!min && size > xSize)) {
235 xSize = size;
236 xNode = node;
237 }
238 }
239 return xNode;
240 }
241
Madan Jampanide003d92015-05-11 17:14:20 -0700242 private CompletableFuture<Void> balanceBuckets(ControllerNode smallest, ControllerNode largest,
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800243 Map<ControllerNode, Set<DeviceId>> controllerDevices,
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800244 int deviceCount) {
245 Collection<DeviceId> minBucket = controllerDevices.get(smallest);
246 Collection<DeviceId> maxBucket = controllerDevices.get(largest);
247 int bucketCount = controllerDevices.keySet().size();
248
249 int delta = (maxBucket.size() - minBucket.size()) / 2;
250 delta = Math.min(deviceCount / bucketCount, delta);
251
Madan Jampanide003d92015-05-11 17:14:20 -0700252 List<CompletableFuture<Void>> setRoleFutures = Lists.newLinkedList();
253
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800254 if (delta > 0) {
255 log.info("Attempting to move {} nodes from {} to {}...", delta,
256 largest.id(), smallest.id());
257
258 int i = 0;
259 Iterator<DeviceId> it = maxBucket.iterator();
260 while (it.hasNext() && i < delta) {
261 DeviceId deviceId = it.next();
262 log.info("Setting {} as the master for {}", smallest.id(), deviceId);
Madan Jampanide003d92015-05-11 17:14:20 -0700263 setRoleFutures.add(setRole(smallest.id(), deviceId, MASTER));
Thomas Vachuska12dfdc32014-11-29 16:03:12 -0800264 controllerDevices.get(smallest).add(deviceId);
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800265 it.remove();
266 i++;
267 }
268 }
Madan Jampanide003d92015-05-11 17:14:20 -0700269
270 return CompletableFuture.allOf(setRoleFutures.toArray(new CompletableFuture[setRoleFutures.size()]));
Thomas Vachuska1e68bdd2014-11-29 13:53:10 -0800271 }
272
273
alshabib339a3d92014-09-26 17:54:32 -0700274 public class InternalDelegate implements MastershipStoreDelegate {
alshabib339a3d92014-09-26 17:54:32 -0700275 @Override
276 public void notify(MastershipEvent event) {
Thomas Vachuska42e8cce2015-07-29 19:25:18 -0700277 post(event);
alshabib339a3d92014-09-26 17:54:32 -0700278 }
alshabib339a3d92014-09-26 17:54:32 -0700279 }
280
Ayaka Koshibe16609692014-09-23 12:46:15 -0700281}