tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 1 | package org.onlab.onos.store.cluster.impl; |
| 2 | |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 3 | import com.google.common.cache.Cache; |
| 4 | import com.google.common.cache.CacheBuilder; |
| 5 | import com.google.common.cache.RemovalListener; |
| 6 | import com.google.common.cache.RemovalNotification; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 7 | import com.google.common.collect.ImmutableSet; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 8 | |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 9 | import org.apache.felix.scr.annotations.Activate; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 10 | import org.apache.felix.scr.annotations.Deactivate; |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 11 | import org.apache.felix.scr.annotations.Reference; |
| 12 | import org.apache.felix.scr.annotations.ReferenceCardinality; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 13 | import org.onlab.onos.cluster.ClusterEvent; |
| 14 | import org.onlab.onos.cluster.ClusterStore; |
| 15 | import org.onlab.onos.cluster.ClusterStoreDelegate; |
| 16 | import org.onlab.onos.cluster.ControllerNode; |
| 17 | import org.onlab.onos.cluster.DefaultControllerNode; |
| 18 | import org.onlab.onos.cluster.NodeId; |
| 19 | import org.onlab.onos.store.AbstractStore; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 20 | import org.onlab.onos.store.cluster.messaging.ClusterCommunicationAdminService; |
Madan Jampani | 3b0dfd5 | 2014-10-02 16:48:13 -0700 | [diff] [blame] | 21 | import org.onlab.onos.store.cluster.messaging.impl.ClusterCommunicationManager; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 22 | import org.onlab.packet.IpPrefix; |
| 23 | import org.slf4j.Logger; |
| 24 | import org.slf4j.LoggerFactory; |
| 25 | |
| 26 | import java.io.IOException; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 27 | import java.util.Map; |
| 28 | import java.util.Set; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 29 | import java.util.concurrent.ConcurrentHashMap; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 30 | import java.util.concurrent.TimeUnit; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 31 | |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 32 | import static org.onlab.onos.cluster.ControllerNode.State; |
| 33 | import static org.onlab.packet.IpPrefix.valueOf; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 34 | |
| 35 | /** |
| 36 | * Distributed implementation of the cluster nodes store. |
| 37 | */ |
Yuta HIGUCHI | 3215ebd | 2014-10-07 14:24:37 -0700 | [diff] [blame^] | 38 | //@Component(immediate = true) |
| 39 | //@Service |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 40 | public class DistributedClusterStore |
| 41 | extends AbstractStore<ClusterEvent, ClusterStoreDelegate> |
| 42 | implements ClusterStore { |
| 43 | |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 44 | private final Logger log = LoggerFactory.getLogger(getClass()); |
| 45 | |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 46 | private DefaultControllerNode localNode; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 47 | private final Map<NodeId, DefaultControllerNode> nodes = new ConcurrentHashMap<>(); |
| 48 | private final Map<NodeId, State> states = new ConcurrentHashMap<>(); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 49 | private final Cache<NodeId, ControllerNode> livenessCache = CacheBuilder.newBuilder() |
| 50 | .maximumSize(1000) |
Madan Jampani | 3b0dfd5 | 2014-10-02 16:48:13 -0700 | [diff] [blame] | 51 | .expireAfterWrite(ClusterCommunicationManager.HEART_BEAT_INTERVAL_MILLIS * 3, TimeUnit.MILLISECONDS) |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 52 | .removalListener(new LivenessCacheRemovalListener()).build(); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 53 | |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 54 | @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY) |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 55 | private ClusterCommunicationAdminService clusterCommunicationAdminService; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 56 | |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 57 | private final ClusterNodesDelegate nodesDelegate = new InnerNodesDelegate(); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 58 | |
| 59 | @Activate |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 60 | public void activate() throws IOException { |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 61 | loadClusterDefinition(); |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 62 | establishSelfIdentity(); |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 63 | |
| 64 | // Start-up the comm service and prime it with the loaded nodes. |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 65 | clusterCommunicationAdminService.initialize(localNode, nodesDelegate); |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 66 | for (DefaultControllerNode node : nodes.values()) { |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 67 | clusterCommunicationAdminService.addNode(node); |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 68 | } |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 69 | log.info("Started"); |
| 70 | } |
| 71 | |
| 72 | @Deactivate |
| 73 | public void deactivate() { |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 74 | log.info("Stopped"); |
| 75 | } |
| 76 | |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 77 | /** |
| 78 | * Loads the cluster definition file. |
| 79 | */ |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 80 | private void loadClusterDefinition() { |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 81 | ClusterDefinitionStore cds = new ClusterDefinitionStore("../config/cluster.json"); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 82 | try { |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 83 | Set<DefaultControllerNode> storedNodes = cds.read(); |
| 84 | for (DefaultControllerNode node : storedNodes) { |
| 85 | nodes.put(node.id(), node); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 86 | } |
| 87 | } catch (IOException e) { |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 88 | log.error("Unable to read cluster definitions", e); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 89 | } |
| 90 | } |
| 91 | |
| 92 | /** |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 93 | * Determines who the local controller node is. |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 94 | */ |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 95 | private void establishSelfIdentity() { |
| 96 | // Establishes the controller's own identity. |
| 97 | IpPrefix ip = valueOf(System.getProperty("onos.ip", "127.0.1.1")); |
| 98 | localNode = nodes.get(new NodeId(ip.toString())); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 99 | |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 100 | // As a fall-back, let's make sure we at least know who we are. |
| 101 | if (localNode == null) { |
| 102 | localNode = new DefaultControllerNode(new NodeId(ip.toString()), ip); |
| 103 | nodes.put(localNode.id(), localNode); |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 104 | } |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 105 | states.put(localNode.id(), State.ACTIVE); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 106 | } |
| 107 | |
| 108 | @Override |
| 109 | public ControllerNode getLocalNode() { |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 110 | return localNode; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 111 | } |
| 112 | |
| 113 | @Override |
| 114 | public Set<ControllerNode> getNodes() { |
| 115 | ImmutableSet.Builder<ControllerNode> builder = ImmutableSet.builder(); |
| 116 | return builder.addAll(nodes.values()).build(); |
| 117 | } |
| 118 | |
| 119 | @Override |
| 120 | public ControllerNode getNode(NodeId nodeId) { |
| 121 | return nodes.get(nodeId); |
| 122 | } |
| 123 | |
| 124 | @Override |
| 125 | public State getState(NodeId nodeId) { |
| 126 | State state = states.get(nodeId); |
| 127 | return state == null ? State.INACTIVE : state; |
| 128 | } |
| 129 | |
| 130 | @Override |
| 131 | public ControllerNode addNode(NodeId nodeId, IpPrefix ip, int tcpPort) { |
| 132 | DefaultControllerNode node = new DefaultControllerNode(nodeId, ip, tcpPort); |
| 133 | nodes.put(nodeId, node); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 134 | clusterCommunicationAdminService.addNode(node); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 135 | return node; |
| 136 | } |
| 137 | |
| 138 | @Override |
| 139 | public void removeNode(NodeId nodeId) { |
tom | d33e640 | 2014-09-30 03:14:43 -0700 | [diff] [blame] | 140 | if (nodeId.equals(localNode.id())) { |
tom | d33e640 | 2014-09-30 03:14:43 -0700 | [diff] [blame] | 141 | nodes.clear(); |
tom | 28e1fa2 | 2014-09-30 10:38:21 -0700 | [diff] [blame] | 142 | nodes.put(localNode.id(), localNode); |
| 143 | |
tom | d33e640 | 2014-09-30 03:14:43 -0700 | [diff] [blame] | 144 | } else { |
| 145 | // Remove the other node. |
| 146 | DefaultControllerNode node = nodes.remove(nodeId); |
| 147 | if (node != null) { |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 148 | clusterCommunicationAdminService.removeNode(node); |
tom | d33e640 | 2014-09-30 03:14:43 -0700 | [diff] [blame] | 149 | } |
tom | 5a8779c | 2014-09-29 14:48:43 -0700 | [diff] [blame] | 150 | } |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 151 | } |
| 152 | |
tom | 1d416c5 | 2014-09-29 20:55:24 -0700 | [diff] [blame] | 153 | // Entity to handle back calls from the connection manager. |
| 154 | private class InnerNodesDelegate implements ClusterNodesDelegate { |
| 155 | @Override |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 156 | public DefaultControllerNode nodeDetected(NodeId nodeId, IpPrefix ip, int tcpPort) { |
| 157 | DefaultControllerNode node = nodes.get(nodeId); |
| 158 | if (node == null) { |
| 159 | node = (DefaultControllerNode) addNode(nodeId, ip, tcpPort); |
| 160 | } |
| 161 | states.put(nodeId, State.ACTIVE); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 162 | livenessCache.put(nodeId, node); |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 163 | return node; |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 164 | } |
tom | 28e1fa2 | 2014-09-30 10:38:21 -0700 | [diff] [blame] | 165 | |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 166 | @Override |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 167 | public void nodeVanished(NodeId nodeId) { |
| 168 | states.put(nodeId, State.INACTIVE); |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 169 | } |
tom | d33e640 | 2014-09-30 03:14:43 -0700 | [diff] [blame] | 170 | |
| 171 | @Override |
| 172 | public void nodeRemoved(NodeId nodeId) { |
| 173 | removeNode(nodeId); |
| 174 | } |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 175 | } |
tom | 8158314 | 2014-09-30 01:40:29 -0700 | [diff] [blame] | 176 | |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 177 | private class LivenessCacheRemovalListener implements RemovalListener<NodeId, ControllerNode> { |
| 178 | |
| 179 | @Override |
| 180 | public void onRemoval(RemovalNotification<NodeId, ControllerNode> entry) { |
| 181 | NodeId nodeId = entry.getKey(); |
| 182 | log.warn("Failed to receive heartbeats from controller: " + nodeId); |
| 183 | nodesDelegate.nodeVanished(nodeId); |
| 184 | } |
| 185 | } |
tom | 7309483 | 2014-09-29 13:47:08 -0700 | [diff] [blame] | 186 | } |