blob: 36475b8879167f9627507157fc08f4c13673042f [file] [log] [blame]
/*
 * Copyright 2015 Open Networking Laboratory
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
16package org.onosproject.store.intent.impl;
17
18import org.apache.felix.scr.annotations.Activate;
19import org.apache.felix.scr.annotations.Component;
20import org.apache.felix.scr.annotations.Deactivate;
21import org.apache.felix.scr.annotations.Reference;
22import org.apache.felix.scr.annotations.ReferenceCardinality;
23import org.apache.felix.scr.annotations.Service;
Jonathan Hartf2fda812015-02-17 15:21:03 -080024import org.onosproject.cluster.ClusterEvent;
25import org.onosproject.cluster.ClusterEventListener;
Jonathan Hart74c83132015-02-02 18:37:57 -080026import org.onosproject.cluster.ClusterService;
Jonathan Hartf2fda812015-02-17 15:21:03 -080027import org.onosproject.cluster.ControllerNode;
Jonathan Hart74c83132015-02-02 18:37:57 -080028import org.onosproject.cluster.Leadership;
29import org.onosproject.cluster.LeadershipEvent;
30import org.onosproject.cluster.LeadershipEventListener;
31import org.onosproject.cluster.LeadershipService;
Brian O'Connor5eb77c82015-03-02 18:09:39 -080032import org.onosproject.cluster.NodeId;
Jonathan Hart5ec32ba2015-02-05 13:33:58 -080033import org.onosproject.net.intent.Key;
Brian O'Connor87ba7a72015-03-11 14:40:09 -070034import org.onosproject.net.intent.PartitionService;
Jonathan Hart74c83132015-02-02 18:37:57 -080035import org.slf4j.Logger;
36import org.slf4j.LoggerFactory;
37
Jonathan Hartdc9d7b82015-02-22 17:59:50 -080038import java.util.List;
Brian O'Connor5eb77c82015-03-02 18:09:39 -080039import java.util.Objects;
Jonathan Hartf2fda812015-02-17 15:21:03 -080040import java.util.concurrent.Executors;
41import java.util.concurrent.ScheduledExecutorService;
42import java.util.concurrent.TimeUnit;
Jonathan Hartdc9d7b82015-02-22 17:59:50 -080043import java.util.stream.Collectors;
Jonathan Hart74c83132015-02-02 18:37:57 -080044
Jonathan Hart74c83132015-02-02 18:37:57 -080045/**
46 * Manages the assignment of intent keyspace partitions to instances.
47 */
48@Component(immediate = true)
49@Service
50public class PartitionManager implements PartitionService {
51
52 private static final Logger log = LoggerFactory.getLogger(PartitionManager.class);
53
54 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
55 protected LeadershipService leadershipService;
56
57 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
58 protected ClusterService clusterService;
59
Jonathan Hart7061acd2015-03-04 13:15:32 -080060 static final int NUM_PARTITIONS = 14;
Jonathan Hartf2fda812015-02-17 15:21:03 -080061 private static final int BACKOFF_TIME = 2;
62 private static final int CHECK_PERIOD = 10;
Jonathan Hart74c83132015-02-02 18:37:57 -080063
64 private static final String ELECTION_PREFIX = "intent-partition-";
65
66 private LeadershipEventListener leaderListener = new InternalLeadershipListener();
Jonathan Hartf2fda812015-02-17 15:21:03 -080067 private ClusterEventListener clusterListener = new InternalClusterEventListener();
Jonathan Hart74c83132015-02-02 18:37:57 -080068
Jonathan Hartf2fda812015-02-17 15:21:03 -080069 private ScheduledExecutorService executor = Executors
70 .newScheduledThreadPool(1);
Jonathan Hart74c83132015-02-02 18:37:57 -080071
72 @Activate
73 public void activate() {
Jonathan Hart74c83132015-02-02 18:37:57 -080074 leadershipService.addListener(leaderListener);
Jonathan Hartf2fda812015-02-17 15:21:03 -080075 clusterService.addListener(clusterListener);
Jonathan Hart74c83132015-02-02 18:37:57 -080076
77 for (int i = 0; i < NUM_PARTITIONS; i++) {
Jonathan Hartf2fda812015-02-17 15:21:03 -080078 leadershipService.runForLeadership(getPartitionPath(i));
Jonathan Hart74c83132015-02-02 18:37:57 -080079 }
Jonathan Hartf2fda812015-02-17 15:21:03 -080080
81 executor.scheduleAtFixedRate(this::doRelinquish, 0,
82 CHECK_PERIOD, TimeUnit.SECONDS);
Jonathan Hart74c83132015-02-02 18:37:57 -080083 }
84
85 @Deactivate
86 public void deactivate() {
Jonathan Hartac48a952015-02-25 14:11:55 -080087 executor.shutdownNow();
88
Jonathan Hart74c83132015-02-02 18:37:57 -080089 leadershipService.removeListener(leaderListener);
Jonathan Hartf2fda812015-02-17 15:21:03 -080090 clusterService.removeListener(clusterListener);
91 }
92
Jonathan Hart7061acd2015-03-04 13:15:32 -080093 /**
94 * Sets the specified executor to be used for scheduling background tasks.
95 *
96 * @param executor scheduled executor service for background tasks
97 * @return this PartitionManager
98 */
99 public PartitionManager withScheduledExecutor(ScheduledExecutorService executor) {
100 this.executor = executor;
101 return this;
102 }
103
Jonathan Hartf2fda812015-02-17 15:21:03 -0800104 private String getPartitionPath(int i) {
105 return ELECTION_PREFIX + i;
Jonathan Hart74c83132015-02-02 18:37:57 -0800106 }
107
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800108 private String getPartitionPath(PartitionId id) {
109 return getPartitionPath(id.value());
110 }
111
Jonathan Hart5ec32ba2015-02-05 13:33:58 -0800112 private PartitionId getPartitionForKey(Key intentKey) {
Brian O'Connor1fdfacd2015-02-18 20:52:06 -0800113 int partition = Math.abs((int) intentKey.hash()) % NUM_PARTITIONS;
114 //TODO investigate Guava consistent hash method
115 // ... does it add significant computational complexity? is it worth it?
116 //int partition = consistentHash(intentKey.hash(), NUM_PARTITIONS);
117 PartitionId id = new PartitionId(partition);
118 log.debug("Getting partition for {}: {}", intentKey, id); //FIXME debug
119 return id;
Jonathan Hart74c83132015-02-02 18:37:57 -0800120 }
121
122 @Override
Jonathan Hart5ec32ba2015-02-05 13:33:58 -0800123 public boolean isMine(Key intentKey) {
Brian O'Connor5eb77c82015-03-02 18:09:39 -0800124 return Objects.equals(leadershipService.getLeader(getPartitionPath(getPartitionForKey(intentKey))),
125 clusterService.getLocalNode().id());
126 }
127
128 @Override
129 public NodeId getLeader(Key intentKey) {
130 return leadershipService.getLeader(getPartitionPath(getPartitionForKey(intentKey)));
Jonathan Hart74c83132015-02-02 18:37:57 -0800131 }
132
Jonathan Hartf2fda812015-02-17 15:21:03 -0800133 private void doRelinquish() {
134 try {
135 relinquish();
136 } catch (Exception e) {
137 log.warn("Exception caught during relinquish task", e);
138 }
139 }
140
Jonathan Hartf2fda812015-02-17 15:21:03 -0800141 /**
142 * Determine whether we have more than our fair share of partitions, and if
143 * so, relinquish leadership of some of them for a little while to let
144 * other instances take over.
145 */
146 private void relinquish() {
147 int activeNodes = (int) clusterService.getNodes()
148 .stream()
149 .filter(n -> clusterService.getState(n.id())
150 == ControllerNode.State.ACTIVE)
151 .count();
152
153 int myShare = (int) Math.ceil((double) NUM_PARTITIONS / activeNodes);
154
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800155 List<Leadership> myPartitions = leadershipService.getLeaderBoard().values()
156 .stream()
157 .filter(l -> clusterService.getLocalNode().id().equals(l.leader()))
158 .filter(l -> l.topic().startsWith(ELECTION_PREFIX))
159 .collect(Collectors.toList());
Jonathan Hartf2fda812015-02-17 15:21:03 -0800160
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800161 int relinquish = myPartitions.size() - myShare;
Jonathan Hartf2fda812015-02-17 15:21:03 -0800162
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800163 if (relinquish <= 0) {
164 return;
165 }
Jonathan Hartf2fda812015-02-17 15:21:03 -0800166
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800167 for (int i = 0; i < relinquish; i++) {
168 String topic = myPartitions.get(i).topic();
169 leadershipService.withdraw(topic);
Jonathan Hartf2fda812015-02-17 15:21:03 -0800170
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800171 executor.schedule(() -> recontest(topic),
172 BACKOFF_TIME, TimeUnit.SECONDS);
Jonathan Hartf2fda812015-02-17 15:21:03 -0800173 }
174 }
175
176 /**
177 * Try and recontest for leadership of a partition.
178 *
179 * @param path topic name to recontest
180 */
181 private void recontest(String path) {
182 leadershipService.runForLeadership(path);
183 }
184
Jonathan Hart74c83132015-02-02 18:37:57 -0800185 private final class InternalLeadershipListener implements LeadershipEventListener {
186
187 @Override
188 public void event(LeadershipEvent event) {
189 Leadership leadership = event.subject();
Jonathan Hartdc9d7b82015-02-22 17:59:50 -0800190
Brian O'Connor5eb77c82015-03-02 18:09:39 -0800191 if (Objects.equals(leadership.leader(), clusterService.getLocalNode().id()) &&
Jonathan Hart74c83132015-02-02 18:37:57 -0800192 leadership.topic().startsWith(ELECTION_PREFIX)) {
193
Jonathan Hartf2fda812015-02-17 15:21:03 -0800194 // See if we need to let some partitions go
195 relinquish();
Jonathan Hart74c83132015-02-02 18:37:57 -0800196 }
Jonathan Hart74c83132015-02-02 18:37:57 -0800197 }
198 }
Jonathan Hartf2fda812015-02-17 15:21:03 -0800199
200 private final class InternalClusterEventListener implements
201 ClusterEventListener {
202
203 @Override
204 public void event(ClusterEvent event) {
205 relinquish();
206 }
207 }
Jonathan Hart74c83132015-02-02 18:37:57 -0800208}