Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 1 | package org.onlab.onos.store.cluster.messaging.impl; |
| 2 | |
| 3 | import static com.google.common.base.Preconditions.checkArgument; |
| 4 | |
| 5 | import java.io.IOException; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 6 | import java.util.Set; |
| 7 | import java.util.Timer; |
| 8 | import java.util.TimerTask; |
Yuta HIGUCHI | 38bd145 | 2014-10-07 17:37:25 -0700 | [diff] [blame] | 9 | import java.util.concurrent.TimeUnit; |
| 10 | import java.util.concurrent.TimeoutException; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 11 | |
| 12 | import org.apache.felix.scr.annotations.Activate; |
| 13 | import org.apache.felix.scr.annotations.Component; |
| 14 | import org.apache.felix.scr.annotations.Deactivate; |
Madan Jampani | a5d0d78 | 2014-10-07 14:36:00 -0700 | [diff] [blame] | 15 | import org.apache.felix.scr.annotations.Reference; |
| 16 | import org.apache.felix.scr.annotations.ReferenceCardinality; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 17 | import org.apache.felix.scr.annotations.Service; |
Madan Jampani | a5d0d78 | 2014-10-07 14:36:00 -0700 | [diff] [blame] | 18 | import org.onlab.onos.cluster.ClusterService; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 19 | import org.onlab.onos.cluster.ControllerNode; |
| 20 | import org.onlab.onos.cluster.NodeId; |
Yuta HIGUCHI | c057c63 | 2014-10-06 18:38:14 -0700 | [diff] [blame] | 21 | import org.onlab.onos.store.cluster.impl.ClusterMembershipEvent; |
| 22 | import org.onlab.onos.store.cluster.impl.ClusterMembershipEventType; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 23 | import org.onlab.onos.store.cluster.impl.ClusterNodesDelegate; |
| 24 | import org.onlab.onos.store.cluster.messaging.ClusterCommunicationAdminService; |
| 25 | import org.onlab.onos.store.cluster.messaging.ClusterCommunicationService; |
| 26 | import org.onlab.onos.store.cluster.messaging.ClusterMessage; |
| 27 | import org.onlab.onos.store.cluster.messaging.ClusterMessageHandler; |
| 28 | import org.onlab.onos.store.cluster.messaging.MessageSubject; |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 29 | import org.onlab.onos.store.serializers.ClusterMessageSerializer; |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 30 | import org.onlab.onos.store.serializers.KryoPoolUtil; |
| 31 | import org.onlab.onos.store.serializers.KryoSerializer; |
| 32 | import org.onlab.util.KryoPool; |
Madan Jampani | c9ed9be | 2014-10-02 16:13:11 -0700 | [diff] [blame] | 33 | import org.onlab.netty.Endpoint; |
| 34 | import org.onlab.netty.Message; |
| 35 | import org.onlab.netty.MessageHandler; |
| 36 | import org.onlab.netty.MessagingService; |
Madan Jampani | da1a6b0 | 2014-10-07 14:16:15 -0700 | [diff] [blame] | 37 | import org.onlab.netty.NettyMessagingService; |
Yuta HIGUCHI | 38bd145 | 2014-10-07 17:37:25 -0700 | [diff] [blame] | 38 | import org.onlab.netty.Response; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 39 | import org.slf4j.Logger; |
| 40 | import org.slf4j.LoggerFactory; |
| 41 | |
| 42 | @Component(immediate = true) |
| 43 | @Service |
Madan Jampani | 3b0dfd5 | 2014-10-02 16:48:13 -0700 | [diff] [blame] | 44 | public class ClusterCommunicationManager |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 45 | implements ClusterCommunicationService, ClusterCommunicationAdminService { |
| 46 | |
| 47 | private final Logger log = LoggerFactory.getLogger(getClass()); |
| 48 | |
| 49 | private ControllerNode localNode; |
Madan Jampani | a5d0d78 | 2014-10-07 14:36:00 -0700 | [diff] [blame] | 50 | |
| 51 | @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY) |
| 52 | private ClusterService clusterService; |
| 53 | |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 54 | private ClusterNodesDelegate nodesDelegate; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 55 | private final Timer timer = new Timer("onos-controller-heatbeats"); |
| 56 | public static final long HEART_BEAT_INTERVAL_MILLIS = 1000L; |
| 57 | |
Yuta HIGUCHI | 993d7aa | 2014-10-06 22:54:38 -0700 | [diff] [blame] | 58 | // TODO: This probably should not be a OSGi service. |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 59 | private MessagingService messagingService; |
| 60 | |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 61 | private static final KryoSerializer SERIALIZER = new KryoSerializer() { |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 62 | @Override |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 63 | protected void setupKryoPool() { |
| 64 | serializerPool = KryoPool.newBuilder() |
| 65 | .register(KryoPoolUtil.API) |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 66 | .register(ClusterMessage.class, new ClusterMessageSerializer()) |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 67 | .register(ClusterMembershipEvent.class) |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 68 | .register(byte[].class) |
| 69 | .register(MessageSubject.class) |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 70 | .build() |
| 71 | .populate(1); |
| 72 | } |
| 73 | |
| 74 | }; |
| 75 | |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 76 | @Activate |
| 77 | public void activate() { |
Madan Jampani | a5d0d78 | 2014-10-07 14:36:00 -0700 | [diff] [blame] | 78 | localNode = clusterService.getLocalNode(); |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 79 | NettyMessagingService netty = new NettyMessagingService(localNode.tcpPort()); |
| 80 | // FIXME: workaround until it becomes a service. |
| 81 | try { |
| 82 | netty.activate(); |
| 83 | } catch (Exception e) { |
| 84 | // TODO Auto-generated catch block |
| 85 | log.error("NettyMessagingService#activate", e); |
| 86 | } |
| 87 | messagingService = netty; |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 88 | log.info("Started"); |
| 89 | } |
| 90 | |
| 91 | @Deactivate |
| 92 | public void deactivate() { |
Yuta HIGUCHI | 993d7aa | 2014-10-06 22:54:38 -0700 | [diff] [blame] | 93 | // TODO: cleanup messageingService if needed. |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 94 | log.info("Stopped"); |
| 95 | } |
| 96 | |
| 97 | @Override |
| 98 | public boolean broadcast(ClusterMessage message) { |
| 99 | boolean ok = true; |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 100 | for (ControllerNode node : clusterService.getNodes()) { |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 101 | if (!node.equals(localNode)) { |
| 102 | ok = unicast(message, node.id()) && ok; |
| 103 | } |
| 104 | } |
| 105 | return ok; |
| 106 | } |
| 107 | |
| 108 | @Override |
| 109 | public boolean multicast(ClusterMessage message, Set<NodeId> nodes) { |
| 110 | boolean ok = true; |
| 111 | for (NodeId nodeId : nodes) { |
| 112 | if (!nodeId.equals(localNode.id())) { |
| 113 | ok = unicast(message, nodeId) && ok; |
| 114 | } |
| 115 | } |
| 116 | return ok; |
| 117 | } |
| 118 | |
| 119 | @Override |
| 120 | public boolean unicast(ClusterMessage message, NodeId toNodeId) { |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 121 | ControllerNode node = clusterService.getNode(toNodeId); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 122 | checkArgument(node != null, "Unknown nodeId: %s", toNodeId); |
| 123 | Endpoint nodeEp = new Endpoint(node.ip().toString(), node.tcpPort()); |
| 124 | try { |
Yuta HIGUCHI | 38bd145 | 2014-10-07 17:37:25 -0700 | [diff] [blame] | 125 | log.info("sending..."); |
| 126 | Response resp = messagingService.sendAndReceive(nodeEp, message.subject().value(), SERIALIZER.encode(message)); |
| 127 | resp.get(1, TimeUnit.SECONDS); |
| 128 | log.info("sent..."); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 129 | return true; |
Yuta HIGUCHI | 38bd145 | 2014-10-07 17:37:25 -0700 | [diff] [blame] | 130 | } catch (IOException | TimeoutException e) { |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 131 | log.error("Failed to send cluster message to nodeId: " + toNodeId, e); |
| 132 | } |
| 133 | |
| 134 | return false; |
| 135 | } |
| 136 | |
| 137 | @Override |
| 138 | public void addSubscriber(MessageSubject subject, |
| 139 | ClusterMessageHandler subscriber) { |
| 140 | messagingService.registerHandler(subject.value(), new InternalClusterMessageHandler(subscriber)); |
| 141 | } |
| 142 | |
| 143 | @Override |
| 144 | public void initialize(ControllerNode localNode, |
| 145 | ClusterNodesDelegate delegate) { |
| 146 | this.localNode = localNode; |
| 147 | this.nodesDelegate = delegate; |
| 148 | this.addSubscriber(new MessageSubject("CLUSTER_MEMBERSHIP_EVENT"), new ClusterMemebershipEventHandler()); |
| 149 | timer.schedule(new KeepAlive(), 0, HEART_BEAT_INTERVAL_MILLIS); |
| 150 | } |
| 151 | |
| 152 | @Override |
| 153 | public void addNode(ControllerNode node) { |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 154 | //members.put(node.id(), node); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 155 | } |
| 156 | |
| 157 | @Override |
| 158 | public void removeNode(ControllerNode node) { |
| 159 | broadcast(new ClusterMessage( |
| 160 | localNode.id(), |
| 161 | new MessageSubject("CLUSTER_MEMBERSHIP_EVENT"), |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 162 | SERIALIZER.encode(new ClusterMembershipEvent(ClusterMembershipEventType.LEAVING_MEMBER, node)))); |
Yuta HIGUCHI | 7a8d4aa | 2014-10-07 17:37:11 -0700 | [diff] [blame] | 163 | //members.remove(node.id()); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 164 | } |
| 165 | |
| 166 | // Sends a heart beat to all peers. |
| 167 | private class KeepAlive extends TimerTask { |
| 168 | |
| 169 | @Override |
| 170 | public void run() { |
| 171 | broadcast(new ClusterMessage( |
| 172 | localNode.id(), |
| 173 | new MessageSubject("CLUSTER_MEMBERSHIP_EVENT"), |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 174 | SERIALIZER.encode(new ClusterMembershipEvent(ClusterMembershipEventType.HEART_BEAT, localNode)))); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 175 | } |
| 176 | } |
| 177 | |
| 178 | private class ClusterMemebershipEventHandler implements ClusterMessageHandler { |
| 179 | |
| 180 | @Override |
| 181 | public void handle(ClusterMessage message) { |
| 182 | |
Madan Jampani | 53e44e6 | 2014-10-07 12:39:51 -0700 | [diff] [blame] | 183 | ClusterMembershipEvent event = SERIALIZER.decode(message.payload()); |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 184 | ControllerNode node = event.node(); |
| 185 | if (event.type() == ClusterMembershipEventType.HEART_BEAT) { |
| 186 | log.info("Node {} sent a hearbeat", node.id()); |
| 187 | nodesDelegate.nodeDetected(node.id(), node.ip(), node.tcpPort()); |
| 188 | } else if (event.type() == ClusterMembershipEventType.LEAVING_MEMBER) { |
| 189 | log.info("Node {} is leaving", node.id()); |
| 190 | nodesDelegate.nodeRemoved(node.id()); |
| 191 | } else if (event.type() == ClusterMembershipEventType.UNREACHABLE_MEMBER) { |
| 192 | log.info("Node {} is unreachable", node.id()); |
| 193 | nodesDelegate.nodeVanished(node.id()); |
| 194 | } |
| 195 | } |
| 196 | } |
| 197 | |
Yuta HIGUCHI | 38bd145 | 2014-10-07 17:37:25 -0700 | [diff] [blame] | 198 | // FIXME: revert static |
| 199 | private class InternalClusterMessageHandler implements MessageHandler { |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 200 | |
| 201 | private final ClusterMessageHandler handler; |
| 202 | |
| 203 | public InternalClusterMessageHandler(ClusterMessageHandler handler) { |
| 204 | this.handler = handler; |
| 205 | } |
| 206 | |
| 207 | @Override |
| 208 | public void handle(Message message) { |
Yuta HIGUCHI | 38bd145 | 2014-10-07 17:37:25 -0700 | [diff] [blame] | 209 | // FIXME: remove me |
| 210 | log.info("InternalClusterMessageHandler.handle({})", message); |
| 211 | try { |
| 212 | log.info("before decode"); |
| 213 | ClusterMessage clusterMessage = SERIALIZER.decode(message.payload()); |
| 214 | log.info("Subject:({}), Sender:({})", clusterMessage.subject(), clusterMessage.sender()); |
| 215 | handler.handle(clusterMessage); |
| 216 | message.respond("ACK".getBytes()); |
| 217 | } catch (Exception e) { |
| 218 | // TODO Auto-generated catch block |
| 219 | log.error("failed", e); |
| 220 | } |
Madan Jampani | 890bc35 | 2014-10-01 22:35:29 -0700 | [diff] [blame] | 221 | } |
| 222 | } |
| 223 | } |