tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 1 | package org.onlab.onos.store.cluster.impl; |
| 2 | |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 3 | import static org.onlab.onos.cluster.MastershipEvent.Type.MASTER_CHANGED; |
| 4 | |
| 5 | import java.util.Map; |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 6 | import java.util.Set; |
Yuta HIGUCHI | c8e19d4 | 2014-09-24 17:20:52 -0700 | [diff] [blame] | 7 | |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 8 | import org.apache.felix.scr.annotations.Activate; |
| 9 | import org.apache.felix.scr.annotations.Component; |
| 10 | import org.apache.felix.scr.annotations.Deactivate; |
| 11 | import org.apache.felix.scr.annotations.Reference; |
| 12 | import org.apache.felix.scr.annotations.ReferenceCardinality; |
Ayaka Koshibe | 25fd23a | 2014-10-03 15:50:43 -0700 | [diff] [blame^] | 13 | import org.apache.felix.scr.annotations.ReferencePolicy; |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 14 | import org.apache.felix.scr.annotations.Service; |
| 15 | import org.onlab.onos.cluster.ClusterService; |
| 16 | import org.onlab.onos.cluster.MastershipEvent; |
| 17 | import org.onlab.onos.cluster.MastershipStore; |
tom | 0755a36 | 2014-09-24 11:54:43 -0700 | [diff] [blame] | 18 | import org.onlab.onos.cluster.MastershipStoreDelegate; |
Ayaka Koshibe | b70d34b | 2014-09-25 15:43:01 -0700 | [diff] [blame] | 19 | import org.onlab.onos.cluster.MastershipTerm; |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 20 | import org.onlab.onos.cluster.NodeId; |
| 21 | import org.onlab.onos.net.DeviceId; |
| 22 | import org.onlab.onos.net.MastershipRole; |
Ayaka Koshibe | 25fd23a | 2014-10-03 15:50:43 -0700 | [diff] [blame^] | 23 | import org.onlab.onos.net.device.DeviceService; |
Yuta HIGUCHI | b5df76d | 2014-09-27 20:54:00 -0700 | [diff] [blame] | 24 | import org.onlab.onos.store.common.AbstractHazelcastStore; |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 25 | |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 26 | import com.google.common.collect.ImmutableSet; |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 27 | import com.hazelcast.core.ILock; |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 28 | import com.hazelcast.core.IMap; |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 29 | |
| 30 | /** |
| 31 | * Distributed implementation of the cluster nodes store. |
| 32 | */ |
| 33 | @Component(immediate = true) |
| 34 | @Service |
tom | 0755a36 | 2014-09-24 11:54:43 -0700 | [diff] [blame] | 35 | public class DistributedMastershipStore |
Yuta HIGUCHI | 2e96389 | 2014-09-27 13:00:39 -0700 | [diff] [blame] | 36 | extends AbstractHazelcastStore<MastershipEvent, MastershipStoreDelegate> |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 37 | implements MastershipStore { |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 38 | |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 39 | //arbitrary lock name |
| 40 | private static final String LOCK = "lock"; |
| 41 | //initial term value |
| 42 | private static final Integer INIT = 0; |
| 43 | //placeholder non-null value |
| 44 | private static final Byte NIL = 0x0; |
| 45 | |
| 46 | //devices to masters |
| 47 | protected IMap<byte[], byte[]> rawMasters; |
| 48 | //devices to terms |
| 49 | protected IMap<byte[], Integer> rawTerms; |
| 50 | //collection of nodes. values are ignored, as it's used as a makeshift 'set' |
| 51 | protected IMap<byte[], Byte> backups; |
| 52 | |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 53 | @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY) |
| 54 | protected ClusterService clusterService; |
| 55 | |
Ayaka Koshibe | 25fd23a | 2014-10-03 15:50:43 -0700 | [diff] [blame^] | 56 | //FIXME: need to guarantee that this will be met, sans circular dependencies |
| 57 | @Reference(policy = ReferencePolicy.DYNAMIC) |
| 58 | protected DeviceService deviceService; |
| 59 | |
Ayaka Koshibe | 406d010 | 2014-09-24 16:08:12 -0700 | [diff] [blame] | 60 | @Override |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 61 | @Activate |
| 62 | public void activate() { |
| 63 | super.activate(); |
| 64 | |
| 65 | rawMasters = theInstance.getMap("masters"); |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 66 | rawTerms = theInstance.getMap("terms"); |
| 67 | backups = theInstance.getMap("backups"); |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 68 | |
Ayaka Koshibe | 5c0f237 | 2014-10-02 17:59:04 -0700 | [diff] [blame] | 69 | rawMasters.addEntryListener(new RemoteMasterShipEventHandler(), true); |
Yuta HIGUCHI | c8e19d4 | 2014-09-24 17:20:52 -0700 | [diff] [blame] | 70 | |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 71 | log.info("Started"); |
| 72 | } |
| 73 | |
| 74 | @Deactivate |
| 75 | public void deactivate() { |
| 76 | log.info("Stopped"); |
| 77 | } |
| 78 | |
| 79 | @Override |
Ayaka Koshibe | 406d010 | 2014-09-24 16:08:12 -0700 | [diff] [blame] | 80 | public MastershipEvent setMaster(NodeId nodeId, DeviceId deviceId) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 81 | byte [] did = serialize(deviceId); |
| 82 | byte [] nid = serialize(nodeId); |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 83 | |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 84 | ILock lock = theInstance.getLock(LOCK); |
| 85 | lock.lock(); |
| 86 | try { |
| 87 | MastershipRole role = getRole(nodeId, deviceId); |
| 88 | Integer term = rawTerms.get(did); |
| 89 | switch (role) { |
| 90 | case MASTER: |
| 91 | return null; |
| 92 | case STANDBY: |
| 93 | rawMasters.put(did, nid); |
| 94 | rawTerms.put(did, ++term); |
| 95 | backups.putIfAbsent(nid, NIL); |
| 96 | break; |
| 97 | case NONE: |
| 98 | rawMasters.put(did, nid); |
| 99 | //new switch OR state transition after being orphaned |
| 100 | if (term == null) { |
| 101 | rawTerms.put(did, INIT); |
| 102 | } else { |
| 103 | rawTerms.put(did, ++term); |
| 104 | } |
| 105 | backups.put(nid, NIL); |
| 106 | break; |
| 107 | default: |
| 108 | log.warn("unknown Mastership Role {}", role); |
| 109 | return null; |
| 110 | } |
| 111 | return new MastershipEvent(MASTER_CHANGED, deviceId, nodeId); |
| 112 | } finally { |
| 113 | lock.unlock(); |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 114 | } |
| 115 | } |
| 116 | |
| 117 | @Override |
| 118 | public NodeId getMaster(DeviceId deviceId) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 119 | return deserialize(rawMasters.get(serialize(deviceId))); |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 120 | } |
| 121 | |
| 122 | @Override |
| 123 | public Set<DeviceId> getDevices(NodeId nodeId) { |
| 124 | ImmutableSet.Builder<DeviceId> builder = ImmutableSet.builder(); |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 125 | |
| 126 | for (Map.Entry<byte[], byte[]> entry : rawMasters.entrySet()) { |
| 127 | if (nodeId.equals(deserialize(entry.getValue()))) { |
| 128 | builder.add((DeviceId) deserialize(entry.getKey())); |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 129 | } |
| 130 | } |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 131 | |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 132 | return builder.build(); |
| 133 | } |
| 134 | |
| 135 | @Override |
| 136 | public MastershipRole requestRole(DeviceId deviceId) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 137 | // first to empty slot for device in master map is MASTER |
| 138 | // depending on how backups are organized, might need to trigger election |
| 139 | // so only controller doesn't set itself to backup for another device |
| 140 | byte [] did = serialize(deviceId); |
| 141 | NodeId local = clusterService.getLocalNode().id(); |
| 142 | byte [] lnid = serialize(local); |
| 143 | |
| 144 | ILock lock = theInstance.getLock(LOCK); |
| 145 | lock.lock(); |
| 146 | try { |
| 147 | MastershipRole role = getRole(local, deviceId); |
| 148 | switch (role) { |
| 149 | case MASTER: |
| 150 | break; |
| 151 | case STANDBY: |
| 152 | backups.put(lnid, NIL); |
| 153 | rawTerms.putIfAbsent(did, INIT); |
| 154 | break; |
| 155 | case NONE: |
| 156 | rawMasters.put(did, lnid); |
| 157 | rawTerms.putIfAbsent(did, INIT); |
| 158 | backups.put(lnid, NIL); |
| 159 | role = MastershipRole.MASTER; |
| 160 | break; |
| 161 | default: |
| 162 | log.warn("unknown Mastership Role {}", role); |
| 163 | } |
| 164 | return role; |
| 165 | } finally { |
| 166 | lock.unlock(); |
| 167 | } |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 168 | } |
| 169 | |
| 170 | @Override |
| 171 | public MastershipRole getRole(NodeId nodeId, DeviceId deviceId) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 172 | byte[] did = serialize(deviceId); |
| 173 | |
| 174 | NodeId current = deserialize(rawMasters.get(did)); |
| 175 | MastershipRole role = null; |
| 176 | |
| 177 | if (current == null) { |
| 178 | //IFF no controllers have claimed mastership over it |
| 179 | role = MastershipRole.NONE; |
| 180 | } else { |
| 181 | if (current.equals(nodeId)) { |
| 182 | role = MastershipRole.MASTER; |
| 183 | } else { |
| 184 | role = MastershipRole.STANDBY; |
| 185 | } |
| 186 | } |
| 187 | |
| 188 | return role; |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 189 | } |
| 190 | |
Ayaka Koshibe | b70d34b | 2014-09-25 15:43:01 -0700 | [diff] [blame] | 191 | @Override |
| 192 | public MastershipTerm getTermFor(DeviceId deviceId) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 193 | byte[] did = serialize(deviceId); |
| 194 | |
| 195 | if ((rawMasters.get(did) == null) || |
| 196 | (rawTerms.get(did) == null)) { |
| 197 | return null; |
| 198 | } |
| 199 | return MastershipTerm.of( |
| 200 | (NodeId) deserialize(rawMasters.get(did)), rawTerms.get(did)); |
Ayaka Koshibe | b70d34b | 2014-09-25 15:43:01 -0700 | [diff] [blame] | 201 | } |
| 202 | |
Ayaka Koshibe | d9f693e | 2014-09-29 18:04:54 -0700 | [diff] [blame] | 203 | @Override |
| 204 | public MastershipEvent unsetMaster(NodeId nodeId, DeviceId deviceId) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 205 | byte [] did = serialize(deviceId); |
| 206 | |
| 207 | ILock lock = theInstance.getLock(LOCK); |
| 208 | lock.lock(); |
| 209 | try { |
| 210 | MastershipRole role = getRole(nodeId, deviceId); |
| 211 | switch (role) { |
| 212 | case MASTER: |
| 213 | //hand off device to another |
| 214 | NodeId backup = reelect(nodeId, deviceId); |
| 215 | if (backup == null) { |
| 216 | //goes back to NONE |
| 217 | rawMasters.remove(did); |
| 218 | } else { |
| 219 | //goes to STANDBY for local, MASTER for someone else |
| 220 | Integer term = rawTerms.get(did); |
| 221 | rawMasters.put(did, serialize(backup)); |
| 222 | rawTerms.put(did, ++term); |
| 223 | return new MastershipEvent(MASTER_CHANGED, deviceId, backup); |
| 224 | } |
| 225 | case STANDBY: |
| 226 | case NONE: |
| 227 | break; |
| 228 | default: |
| 229 | log.warn("unknown Mastership Role {}", role); |
| 230 | } |
| 231 | return null; |
| 232 | } finally { |
| 233 | lock.unlock(); |
| 234 | } |
| 235 | } |
| 236 | |
| 237 | //helper for "re-electing" a new master for a given device |
| 238 | private NodeId reelect(NodeId current, DeviceId deviceId) { |
Ayaka Koshibe | 25fd23a | 2014-10-03 15:50:43 -0700 | [diff] [blame^] | 239 | |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 240 | for (byte [] node : backups.keySet()) { |
| 241 | NodeId nid = deserialize(node); |
Ayaka Koshibe | 25fd23a | 2014-10-03 15:50:43 -0700 | [diff] [blame^] | 242 | //if a device dies we shouldn't pick another master for it. |
| 243 | if (!current.equals(nid) && (deviceService.isAvailable(deviceId))) { |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 244 | return nid; |
| 245 | } |
| 246 | } |
Ayaka Koshibe | d9f693e | 2014-09-29 18:04:54 -0700 | [diff] [blame] | 247 | return null; |
| 248 | } |
| 249 | |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 250 | //adds node to pool(s) of backup |
| 251 | private void backup(NodeId nodeId, DeviceId deviceId) { |
Ayaka Koshibe | 5c0f237 | 2014-10-02 17:59:04 -0700 | [diff] [blame] | 252 | //TODO might be useful to isolate out this function and reelect() if we |
| 253 | //get more backup/election schemes |
Ayaka Koshibe | 8583ff3 | 2014-10-02 16:25:30 -0700 | [diff] [blame] | 254 | } |
| 255 | |
Ayaka Koshibe | 5c0f237 | 2014-10-02 17:59:04 -0700 | [diff] [blame] | 256 | private class RemoteMasterShipEventHandler extends RemoteEventHandler<DeviceId, NodeId> { |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 257 | |
| 258 | @Override |
| 259 | protected void onAdd(DeviceId deviceId, NodeId nodeId) { |
Ayaka Koshibe | 5c0f237 | 2014-10-02 17:59:04 -0700 | [diff] [blame] | 260 | //only addition indicates a change in mastership |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 261 | notifyDelegate(new MastershipEvent(MASTER_CHANGED, deviceId, nodeId)); |
| 262 | } |
| 263 | |
| 264 | @Override |
| 265 | protected void onRemove(DeviceId deviceId, NodeId nodeId) { |
Ayaka Koshibe | 5c0f237 | 2014-10-02 17:59:04 -0700 | [diff] [blame] | 266 | //notifyDelegate(new MastershipEvent(MASTER_CHANGED, deviceId, nodeId)); |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 267 | } |
| 268 | |
| 269 | @Override |
| 270 | protected void onUpdate(DeviceId deviceId, NodeId oldNodeId, NodeId nodeId) { |
Ayaka Koshibe | 5c0f237 | 2014-10-02 17:59:04 -0700 | [diff] [blame] | 271 | //notifyDelegate(new MastershipEvent(MASTER_CHANGED, deviceId, nodeId)); |
alshabib | 339a3d9 | 2014-09-26 17:54:32 -0700 | [diff] [blame] | 272 | } |
| 273 | } |
| 274 | |
tom | b41d1ac | 2014-09-24 01:51:24 -0700 | [diff] [blame] | 275 | } |