/*
 * Copyright 2015 Open Networking Laboratory
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.onosproject.store.consistent.impl;

import com.google.common.collect.ImmutableSet;
import com.google.common.collect.Lists;
import com.google.common.collect.Maps;
import com.google.common.collect.Sets;
import com.google.common.util.concurrent.Futures;

import net.kuujo.copycat.CopycatConfig;
import net.kuujo.copycat.cluster.ClusterConfig;
import net.kuujo.copycat.cluster.Member;
import net.kuujo.copycat.cluster.Member.Type;
import net.kuujo.copycat.cluster.internal.coordinator.ClusterCoordinator;
import net.kuujo.copycat.cluster.internal.coordinator.DefaultClusterCoordinator;
import net.kuujo.copycat.log.BufferedLog;
import net.kuujo.copycat.log.FileLog;
import net.kuujo.copycat.log.Log;
import net.kuujo.copycat.netty.NettyTcpProtocol;
import net.kuujo.copycat.protocol.Consistency;
import net.kuujo.copycat.protocol.Protocol;
import net.kuujo.copycat.util.concurrent.NamedThreadFactory;

import org.apache.commons.lang.math.RandomUtils;
import org.apache.felix.scr.annotations.Activate;
import org.apache.felix.scr.annotations.Component;
import org.apache.felix.scr.annotations.Deactivate;
import org.apache.felix.scr.annotations.Reference;
import org.apache.felix.scr.annotations.ReferenceCardinality;
import org.apache.felix.scr.annotations.Service;
import org.onosproject.cluster.ClusterService;
import org.onosproject.core.IdGenerator;
import org.onosproject.store.cluster.impl.ClusterDefinitionManager;
import org.onosproject.store.cluster.impl.NodeInfo;
import org.onosproject.store.cluster.messaging.ClusterCommunicationService;
import org.onosproject.store.ecmap.EventuallyConsistentMapBuilderImpl;
import org.onosproject.store.service.AtomicCounterBuilder;
import org.onosproject.store.service.ConsistentMapBuilder;
import org.onosproject.store.service.ConsistentMapException;
import org.onosproject.store.service.EventuallyConsistentMapBuilder;
import org.onosproject.store.service.MapInfo;
import org.onosproject.store.service.PartitionInfo;
import org.onosproject.store.service.SetBuilder;
import org.onosproject.store.service.StorageAdminService;
import org.onosproject.store.service.StorageService;
import org.onosproject.store.service.Transaction;
import org.onosproject.store.service.TransactionContextBuilder;
import org.slf4j.Logger;

import java.io.File;
import java.io.IOException;
import java.util.Collection;
import java.util.List;
import java.util.Locale;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ExecutionException;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.TimeoutException;
import java.util.stream.Collectors;

import static org.slf4j.LoggerFactory.getLogger;

80/**
81 * Database manager.
82 */
83@Component(immediate = true, enabled = true)
84@Service
Jonathan Hart054da972015-02-18 17:30:28 -080085public class DatabaseManager implements StorageService, StorageAdminService {
Madan Jampani09342702015-02-05 23:32:40 -080086
87 private final Logger log = getLogger(getClass());
Thomas Vachuskade563cf2015-04-01 00:28:50 -070088
89 public static final int COPYCAT_TCP_PORT = 7238; // 7238 = RAFT
90 public static final String PARTITION_DEFINITION_FILE = "../config/tablets.json";
91 public static final String BASE_PARTITION_NAME = "p0";
92
Madan Jampani1a4eca02015-04-02 15:29:26 -070093 private static final int RAFT_ELECTION_TIMEOUT_MILLIS = 3000;
Madan Jampania89f8f92015-04-01 14:39:54 -070094 private static final int DATABASE_OPERATION_TIMEOUT_MILLIS = 5000;
Thomas Vachuskade563cf2015-04-01 00:28:50 -070095
Madan Jampanif1b8e172015-03-23 11:42:02 -070096 private ClusterCoordinator coordinator;
Madan Jampani09342702015-02-05 23:32:40 -080097 private PartitionedDatabase partitionedDatabase;
Madan Jampanif1b8e172015-03-23 11:42:02 -070098 private Database inMemoryDatabase;
Madan Jampanife3a9a72015-03-13 16:32:26 -070099
Madan Jampanibff6d8f2015-03-31 16:53:47 -0700100 private TransactionManager transactionManager;
101 private final IdGenerator transactionIdGenerator = () -> RandomUtils.nextLong();
102
Madan Jampani09342702015-02-05 23:32:40 -0800103 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
104 protected ClusterService clusterService;
105
Jonathan Hart6ec029a2015-03-24 17:12:35 -0700106 @Reference(cardinality = ReferenceCardinality.MANDATORY_UNARY)
107 protected ClusterCommunicationService clusterCommunicator;
108
Madan Jampani0cb00672015-02-27 00:27:22 -0800109 protected String nodeToUri(NodeInfo node) {
Madan Jampani27b69c62015-05-15 15:49:02 -0700110 return String.format("onos://%s:%d", node.getIp(), node.getTcpPort());
Madan Jampani09342702015-02-05 23:32:40 -0800111 }
112
113 @Activate
114 public void activate() {
Madan Jampani09342702015-02-05 23:32:40 -0800115 // load database configuration
Thomas Vachuskade563cf2015-04-01 00:28:50 -0700116 File databaseDefFile = new File(PARTITION_DEFINITION_FILE);
117 log.info("Loading database definition: {}", databaseDefFile.getAbsolutePath());
Madan Jampani09342702015-02-05 23:32:40 -0800118
Madan Jampani0cb00672015-02-27 00:27:22 -0800119 Map<String, Set<NodeInfo>> partitionMap;
Madan Jampani09342702015-02-05 23:32:40 -0800120 try {
Thomas Vachuskade563cf2015-04-01 00:28:50 -0700121 DatabaseDefinitionStore databaseDefStore = new DatabaseDefinitionStore(databaseDefFile);
122 if (!databaseDefFile.exists()) {
Thomas Vachuska8dc1a692015-03-31 01:01:37 -0700123 createDefaultDatabaseDefinition(databaseDefStore);
124 }
125 partitionMap = databaseDefStore.read().getPartitions();
Madan Jampani09342702015-02-05 23:32:40 -0800126 } catch (IOException e) {
Madan Jampani09342702015-02-05 23:32:40 -0800127 throw new IllegalStateException("Failed to load database config", e);
128 }
129
130 String[] activeNodeUris = partitionMap.values()
131 .stream()
132 .reduce((s1, s2) -> Sets.union(s1, s2))
133 .get()
134 .stream()
135 .map(this::nodeToUri)
136 .toArray(String[]::new);
137
Madan Jampani0cb00672015-02-27 00:27:22 -0800138 String localNodeUri = nodeToUri(NodeInfo.of(clusterService.getLocalNode()));
Madan Jampani27b69c62015-05-15 15:49:02 -0700139 Protocol protocol = new CopycatCommunicationProtocol(clusterService, clusterCommunicator);
Madan Jampani09342702015-02-05 23:32:40 -0800140
141 ClusterConfig clusterConfig = new ClusterConfig()
Madan Jampani27b69c62015-05-15 15:49:02 -0700142 .withProtocol(protocol)
Madan Jampani1a4eca02015-04-02 15:29:26 -0700143 .withElectionTimeout(electionTimeoutMillis(activeNodeUris))
144 .withHeartbeatInterval(heartbeatTimeoutMillis(activeNodeUris))
Madan Jampani09342702015-02-05 23:32:40 -0800145 .withMembers(activeNodeUris)
146 .withLocalMember(localNodeUri);
147
Madan Jampanif1b8e172015-03-23 11:42:02 -0700148 CopycatConfig copycatConfig = new CopycatConfig()
149 .withName("onos")
150 .withClusterConfig(clusterConfig)
151 .withDefaultSerializer(new DatabaseSerializer())
152 .withDefaultExecutor(Executors.newSingleThreadExecutor(new NamedThreadFactory("copycat-coordinator-%d")));
Madan Jampani09342702015-02-05 23:32:40 -0800153
Madan Jampanif1b8e172015-03-23 11:42:02 -0700154 coordinator = new DefaultClusterCoordinator(copycatConfig.resolve());
155
156 DatabaseConfig inMemoryDatabaseConfig =
157 newDatabaseConfig(BASE_PARTITION_NAME, newInMemoryLog(), activeNodeUris);
158 inMemoryDatabase = coordinator
159 .getResource(inMemoryDatabaseConfig.getName(), inMemoryDatabaseConfig.resolve(clusterConfig)
160 .withSerializer(copycatConfig.getDefaultSerializer())
161 .withDefaultExecutor(copycatConfig.getDefaultExecutor()));
162
163 List<Database> partitions = partitionMap.entrySet()
164 .stream()
165 .map(entry -> {
166 String[] replicas = entry.getValue().stream().map(this::nodeToUri).toArray(String[]::new);
167 return newDatabaseConfig(entry.getKey(), newPersistentLog(), replicas);
168 })
169 .map(config -> {
170 Database db = coordinator.getResource(config.getName(), config.resolve(clusterConfig)
171 .withSerializer(copycatConfig.getDefaultSerializer())
172 .withDefaultExecutor(copycatConfig.getDefaultExecutor()));
173 return db;
174 })
175 .collect(Collectors.toList());
176
177 partitionedDatabase = new PartitionedDatabase("onos-store", partitions);
Madan Jampani09342702015-02-05 23:32:40 -0800178
Madan Jampani0d03d602015-04-20 12:03:56 -0700179 CompletableFuture<Void> status = coordinator.open()
Madan Jampanif1b8e172015-03-23 11:42:02 -0700180 .thenCompose(v -> CompletableFuture.allOf(inMemoryDatabase.open(), partitionedDatabase.open())
181 .whenComplete((db, error) -> {
182 if (error != null) {
Madan Jampani0d03d602015-04-20 12:03:56 -0700183 log.error("Failed to initialize database.", error);
Madan Jampanif1b8e172015-03-23 11:42:02 -0700184 } else {
Madan Jampani0d03d602015-04-20 12:03:56 -0700185 log.info("Successfully initialized database.");
Madan Jampanif1b8e172015-03-23 11:42:02 -0700186 }
187 }));
188
Madan Jampani0d03d602015-04-20 12:03:56 -0700189 Futures.getUnchecked(status);
190
Madan Jampanibff6d8f2015-03-31 16:53:47 -0700191 transactionManager = new TransactionManager(partitionedDatabase);
Madan Jampani09342702015-02-05 23:32:40 -0800192 log.info("Started");
193 }
194
Thomas Vachuska8dc1a692015-03-31 01:01:37 -0700195 private void createDefaultDatabaseDefinition(DatabaseDefinitionStore store) {
196 // Assumes IPv4 is returned.
Madan Jampaniafeebbd2015-05-19 15:26:01 -0700197 String ip = ClusterDefinitionManager.getSiteLocalAddress();
Thomas Vachuskade563cf2015-04-01 00:28:50 -0700198 NodeInfo node = NodeInfo.from(ip, ip, COPYCAT_TCP_PORT);
Thomas Vachuska8dc1a692015-03-31 01:01:37 -0700199 try {
Thomas Vachuskade563cf2015-04-01 00:28:50 -0700200 store.write(DatabaseDefinition.from(ImmutableSet.of(node)));
Thomas Vachuska8dc1a692015-03-31 01:01:37 -0700201 } catch (IOException e) {
202 log.warn("Unable to write default cluster definition", e);
203 }
204 }
205
Madan Jampani09342702015-02-05 23:32:40 -0800206 @Deactivate
207 public void deactivate() {
Madan Jampanif1b8e172015-03-23 11:42:02 -0700208 CompletableFuture.allOf(inMemoryDatabase.close(), partitionedDatabase.close())
209 .thenCompose(v -> coordinator.close())
210 .whenComplete((result, error) -> {
211 if (error != null) {
212 log.warn("Failed to cleanly close databases.", error);
213 } else {
214 log.info("Successfully closed databases.");
215 }
216 });
Madan Jampani09342702015-02-05 23:32:40 -0800217 log.info("Stopped");
218 }
219
220 @Override
Ayaka Koshibe3a321562015-04-29 13:24:07 -0700221 public TransactionContextBuilder transactionContextBuilder() {
222 return new DefaultTransactionContextBuilder(
223 inMemoryDatabase, partitionedDatabase, transactionIdGenerator.getNewId());
Madan Jampani64689552015-02-17 10:00:27 -0800224 }
Jonathan Hart054da972015-02-18 17:30:28 -0800225
226 @Override
227 public List<PartitionInfo> getPartitionInfo() {
Madan Jampanif1b8e172015-03-23 11:42:02 -0700228 return Lists.asList(
229 inMemoryDatabase,
230 partitionedDatabase.getPartitions().toArray(new Database[]{}))
Jonathan Hart054da972015-02-18 17:30:28 -0800231 .stream()
Madan Jampanif1b8e172015-03-23 11:42:02 -0700232 .map(DatabaseManager::toPartitionInfo)
Jonathan Hart054da972015-02-18 17:30:28 -0800233 .collect(Collectors.toList());
234 }
235
Madan Jampani27b69c62015-05-15 15:49:02 -0700236 @SuppressWarnings("unused")
Madan Jampanif1b8e172015-03-23 11:42:02 -0700237 private Protocol newNettyProtocol() {
238 return new NettyTcpProtocol()
239 .withSsl(false)
240 .withConnectTimeout(60000)
241 .withAcceptBacklog(1024)
242 .withTrafficClass(-1)
243 .withSoLinger(-1)
244 .withReceiveBufferSize(32768)
245 .withSendBufferSize(8192)
246 .withThreads(1);
247 }
248
249 private Log newPersistentLog() {
250 String logDir = System.getProperty("karaf.data", "./data");
251 return new FileLog()
252 .withDirectory(logDir)
253 .withSegmentSize(1073741824) // 1GB
254 .withFlushOnWrite(true)
255 .withSegmentInterval(Long.MAX_VALUE);
256 }
257
258 private Log newInMemoryLog() {
259 return new BufferedLog()
260 .withFlushOnWrite(false)
261 .withFlushInterval(Long.MAX_VALUE)
262 .withSegmentSize(10485760) // 10MB
263 .withSegmentInterval(Long.MAX_VALUE);
264 }
265
266 private DatabaseConfig newDatabaseConfig(String name, Log log, String[] replicas) {
267 return new DatabaseConfig()
268 .withName(name)
Madan Jampani1a4eca02015-04-02 15:29:26 -0700269 .withElectionTimeout(electionTimeoutMillis(replicas))
270 .withHeartbeatInterval(heartbeatTimeoutMillis(replicas))
Madan Jampanif1b8e172015-03-23 11:42:02 -0700271 .withConsistency(Consistency.STRONG)
272 .withLog(log)
273 .withDefaultSerializer(new DatabaseSerializer())
274 .withReplicas(replicas);
275 }
276
Madan Jampani1a4eca02015-04-02 15:29:26 -0700277 private long electionTimeoutMillis(String[] replicas) {
278 return replicas.length == 1 ? 10L : RAFT_ELECTION_TIMEOUT_MILLIS;
279 }
280
281 private long heartbeatTimeoutMillis(String[] replicas) {
282 return electionTimeoutMillis(replicas) / 2;
283 }
284
Jonathan Hart054da972015-02-18 17:30:28 -0800285 /**
286 * Maps a Raft Database object to a PartitionInfo object.
287 *
288 * @param database database containing input data
289 * @return PartitionInfo object
290 */
Madan Jampanif1b8e172015-03-23 11:42:02 -0700291 private static PartitionInfo toPartitionInfo(Database database) {
Jonathan Hart054da972015-02-18 17:30:28 -0800292 return new PartitionInfo(database.name(),
293 database.cluster().term(),
Madan Jampanif1b8e172015-03-23 11:42:02 -0700294 database.cluster().members()
295 .stream()
296 .filter(member -> Type.ACTIVE.equals(member.type()))
Jonathan Hart054da972015-02-18 17:30:28 -0800297 .map(Member::uri)
Madan Jampanif1b8e172015-03-23 11:42:02 -0700298 .sorted()
Jonathan Hart054da972015-02-18 17:30:28 -0800299 .collect(Collectors.toList()),
300 database.cluster().leader() != null ?
301 database.cluster().leader().uri() : null);
302 }
Jonathan Hart6ec029a2015-03-24 17:12:35 -0700303
304
305 @Override
306 public <K, V> EventuallyConsistentMapBuilder<K, V> eventuallyConsistentMapBuilder() {
307 return new EventuallyConsistentMapBuilderImpl<>(clusterService,
308 clusterCommunicator);
309 }
310
Madan Jampanif1b8e172015-03-23 11:42:02 -0700311 @Override
312 public <K, V> ConsistentMapBuilder<K, V> consistentMapBuilder() {
313 return new DefaultConsistentMapBuilder<>(inMemoryDatabase, partitionedDatabase);
314 }
Madan Jampania89f8f92015-04-01 14:39:54 -0700315
316 @Override
Madan Jampani08706ce2015-04-01 14:49:28 -0700317 public <E> SetBuilder<E> setBuilder() {
318 return new DefaultSetBuilder<>(partitionedDatabase);
319 }
320
321 @Override
Madan Jampanib5d72d52015-04-03 16:53:50 -0700322 public AtomicCounterBuilder atomicCounterBuilder() {
323 return new DefaultAtomicCounterBuilder(inMemoryDatabase, partitionedDatabase);
324 }
325
326 @Override
Madan Jampania89f8f92015-04-01 14:39:54 -0700327 public List<MapInfo> getMapInfo() {
328 List<MapInfo> maps = Lists.newArrayList();
329 maps.addAll(getMapInfo(inMemoryDatabase));
330 maps.addAll(getMapInfo(partitionedDatabase));
331 return maps;
332 }
333
334 private List<MapInfo> getMapInfo(Database database) {
335 return complete(database.tableNames())
336 .stream()
337 .map(name -> new MapInfo(name, complete(database.size(name))))
338 .filter(info -> info.size() > 0)
339 .collect(Collectors.toList());
340 }
341
Madan Jampanib5d72d52015-04-03 16:53:50 -0700342
343 @Override
344 public Map<String, Long> getCounters() {
345 Map<String, Long> counters = Maps.newHashMap();
346 counters.putAll(complete(inMemoryDatabase.counters()));
347 counters.putAll(complete(partitionedDatabase.counters()));
348 return counters;
349 }
350
Madan Jampanibff6d8f2015-03-31 16:53:47 -0700351 @Override
Kaouther Abrouguid8b565a2015-05-20 16:07:20 -0700352 public Map<String, Long> getPartitionedDatabaseCounters() {
353 Map<String, Long> counters = Maps.newHashMap();
354 counters.putAll(complete(partitionedDatabase.counters()));
355 return counters;
356 }
357
358 @Override
359 public Map<String, Long> getInMemoryDatabaseCounters() {
360 Map<String, Long> counters = Maps.newHashMap();
361 counters.putAll(complete(inMemoryDatabase.counters()));
362 return counters;
363 }
364
365 @Override
Madan Jampanibff6d8f2015-03-31 16:53:47 -0700366 public Collection<Transaction> getTransactions() {
367 return complete(transactionManager.getTransactions());
368 }
369
Madan Jampania89f8f92015-04-01 14:39:54 -0700370 private static <T> T complete(CompletableFuture<T> future) {
371 try {
372 return future.get(DATABASE_OPERATION_TIMEOUT_MILLIS, TimeUnit.MILLISECONDS);
373 } catch (InterruptedException e) {
374 Thread.currentThread().interrupt();
375 throw new ConsistentMapException.Interrupted();
376 } catch (TimeoutException e) {
377 throw new ConsistentMapException.Timeout();
378 } catch (ExecutionException e) {
379 throw new ConsistentMapException(e.getCause());
380 }
381 }
Madan Jampanibff6d8f2015-03-31 16:53:47 -0700382
383 @Override
384 public void redriveTransactions() {
385 getTransactions().stream().forEach(transactionManager::execute);
386 }
Madan Jampanib5d72d52015-04-03 16:53:50 -0700387}