2 * ============LICENSE_START=======================================================
4 * ================================================================================
5 * Copyright (C) 2018 AT&T Intellectual Property. All rights
7 * ================================================================================
8 * Licensed under the Apache License, Version 2.0 (the "License");
9 * you may not use this file except in compliance with the License.
10 * You may obtain a copy of the License at
12 * http://www.apache.org/licenses/LICENSE-2.0
14 * Unless required by applicable law or agreed to in writing, software
15 * distributed under the License is distributed on an "AS IS" BASIS,
16 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17 * See the License for the specific language governing permissions and
18 * limitations under the License.
19 * ============LICENSE_END=========================================================
22 package org.onap.ccsdk.sli.plugins.grtoolkit;
24 import java.io.BufferedReader;
26 import java.io.FileInputStream;
27 import java.io.FileReader;
28 import java.io.IOException;
29 import java.io.InputStreamReader;
30 import java.io.OutputStream;
31 import java.net.HttpURLConnection;
33 import java.nio.charset.StandardCharsets;
34 import java.sql.Connection;
35 import java.sql.SQLException;
36 import java.util.ArrayList;
37 import java.util.Collection;
38 import java.util.HashMap;
40 import java.util.Properties;
41 import java.util.List;
42 import java.util.concurrent.ExecutorService;
43 import java.util.concurrent.Executors;
44 import java.util.regex.Matcher;
45 import java.util.regex.Pattern;
46 import javax.annotation.Nonnull;
48 import com.google.common.util.concurrent.Futures;
49 import com.google.common.util.concurrent.ListenableFuture;
51 import org.onap.ccsdk.sli.core.dblib.DBLibConnection;
52 import org.onap.ccsdk.sli.core.dblib.DbLibService;
53 import org.onap.ccsdk.sli.plugins.grtoolkit.data.ClusterActor;
54 import org.onap.ccsdk.sli.plugins.grtoolkit.data.MemberBuilder;
56 import org.json.JSONArray;
57 import org.json.JSONException;
58 import org.json.JSONObject;
60 import org.opendaylight.controller.cluster.datastore.DistributedDataStoreInterface;
61 import org.opendaylight.controller.md.sal.binding.api.DataBroker;
62 import org.opendaylight.controller.md.sal.binding.api.DataTreeChangeListener;
63 import org.opendaylight.controller.md.sal.binding.api.NotificationPublishService;
64 import org.opendaylight.controller.sal.binding.api.BindingAwareBroker;
65 import org.opendaylight.controller.sal.binding.api.RpcProviderRegistry;
66 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthInput;
67 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthOutput;
68 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthOutputBuilder;
69 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthInput;
70 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthOutput;
71 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthOutputBuilder;
72 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthInput;
73 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthOutput;
74 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthOutputBuilder;
75 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverInput;
76 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverOutput;
77 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverOutputBuilder;
78 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.GrToolkitService;
79 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficInput;
80 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficOutput;
81 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficOutputBuilder;
82 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.Member;
83 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficInput;
84 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficOutput;
85 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficOutputBuilder;
86 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.Site;
87 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthInput;
88 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthOutput;
89 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthOutputBuilder;
90 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierInput;
91 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierOutput;
92 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierOutputBuilder;
93 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.site.health.output.SitesBuilder;
94 import org.opendaylight.yangtools.yang.common.RpcResult;
95 import org.opendaylight.yangtools.yang.common.RpcResultBuilder;
97 import org.slf4j.Logger;
98 import org.slf4j.LoggerFactory;
100 public class GrToolkitProvider implements AutoCloseable, GrToolkitService, DataTreeChangeListener {
101 private static final String APP_NAME = "gr-toolkit";
102 private static final String PROPERTIES_FILE = System.getenv("SDNC_CONFIG_DIR") + "/gr-toolkit.properties";
103 private static final String HEALTHY = "HEALTHY";
104 private static final String FAULTY = "FAULTY";
105 private static final String VALUE = "value";
106 private String akkaConfig;
107 private String jolokiaClusterPath;
108 private String shardManagerPath;
109 private String shardPathTemplate;
110 private String credentials;
111 private String httpProtocol;
112 private String siteIdentifier = System.getenv("SITE_NAME");
113 private final Logger log = LoggerFactory.getLogger(GrToolkitProvider.class);
114 private final ExecutorService executor;
115 protected DataBroker dataBroker;
116 protected NotificationPublishService notificationService;
117 protected RpcProviderRegistry rpcRegistry;
118 protected BindingAwareBroker.RpcRegistration<GrToolkitService> rpcRegistration;
119 protected DbLibService dbLib;
120 private String member;
121 private ClusterActor self;
122 private HashMap<String, ClusterActor> memberMap;
123 private SiteConfiguration siteConfiguration;
124 private Properties properties;
125 private DistributedDataStoreInterface configDatastore;
/**
 * Creates the provider, stores the injected services and runs the private initialization.
 *
 * @param dataBroker                  data broker stored in {@code dataBroker}
 * @param notificationProviderService notification service stored in {@code notificationService}
 * @param rpcProviderRegistry         registry used to register this class as the RPC implementation
 * @param configDatastore             datastore used to look up the local member name
 * @param dbLibService                database library service stored in {@code dbLib}
 */
public GrToolkitProvider(DataBroker dataBroker,
                         NotificationPublishService notificationProviderService,
                         RpcProviderRegistry rpcProviderRegistry,
                         DistributedDataStoreInterface configDatastore,
                         DbLibService dbLibService) {
    log.info("Creating provider for {}", APP_NAME);
    this.executor = Executors.newFixedThreadPool(1);
    this.dataBroker = dataBroker;
    this.notificationService = notificationProviderService;
    this.rpcRegistry = rpcProviderRegistry;
    this.configDatastore = configDatastore;
    this.dbLib = dbLibService;
    // NOTE(review): initialize() is private and has no other visible caller, so it is
    // invoked here once all collaborators are assigned; confirm against the original file.
    initialize();
}
141 private void initialize() {
142 log.info("Initializing provider for {}", APP_NAME);
143 // Create the top level containers
148 rpcRegistration = rpcRegistry.addRpcImplementation(GrToolkitService.class, this);
149 log.info("Initialization complete for {}", APP_NAME);
152 private void setProperties() {
153 log.info("Loading properties from {}", PROPERTIES_FILE);
154 properties = new Properties();
155 File propertiesFile = new File(PROPERTIES_FILE);
156 if(!propertiesFile.exists()) {
157 log.warn("Properties file not found.");
160 try(FileInputStream fileInputStream = new FileInputStream(propertiesFile)) {
161 properties.load(fileInputStream);
162 if(!properties.containsKey(PropertyKeys.SITE_IDENTIFIER)) {
163 properties.put(PropertyKeys.SITE_IDENTIFIER, "Unknown Site");
165 String port = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL).trim()) ? properties.getProperty(PropertyKeys.CONTROLLER_PORT_SSL).trim() : properties.getProperty(PropertyKeys.CONTROLLER_PORT_HTTP).trim();
166 httpProtocol = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL).trim()) ? "https://" : "http://";
167 akkaConfig = properties.getProperty(PropertyKeys.AKKA_CONF_LOCATION).trim();
168 jolokiaClusterPath = ":" + port + properties.getProperty(PropertyKeys.MBEAN_CLUSTER).trim();
169 shardManagerPath = ":" + port + properties.getProperty(PropertyKeys.MBEAN_SHARD_MANAGER).trim();
170 shardPathTemplate = ":" + port + properties.getProperty(PropertyKeys.MBEAN_SHARD_CONFIG).trim();
171 if(siteIdentifier == null || siteIdentifier.isEmpty()) {
172 siteIdentifier = properties.getProperty(PropertyKeys.SITE_IDENTIFIER).trim();
174 credentials = properties.getProperty(PropertyKeys.CONTROLLER_CREDENTIALS).trim();
175 log.info("Loaded properties.");
176 } catch(IOException e) {
177 log.error("Error loading properties.", e);
181 private void defineMembers() {
182 member = configDatastore.getActorContext().getCurrentMemberName().getName();
183 log.info("Cluster member: {}", member);
185 log.info("Parsing akka.conf for cluster memberMap...");
187 File akkaConfigFile = new File(this.akkaConfig);
188 try(FileReader fileReader = new FileReader(akkaConfigFile);
189 BufferedReader bufferedReader = new BufferedReader(fileReader)) {
191 while((line = bufferedReader.readLine()) != null) {
192 if(line.contains("seed-nodes =")) {
193 parseSeedNodes(line);
198 } catch(IOException e) {
199 log.error("Couldn't load akka", e);
200 } catch(NullPointerException e) {
201 log.error("akkaConfig is null. Check properties file and restart {} bundle.", APP_NAME);
203 log.info("self:\n{}", self);
206 private void createContainers() {
207 // Replace with MD-SAL write for FailoverStatus
210 protected void initializeChild() {
211 // Override if you have custom initialization intelligence
215 public void close() throws Exception {
216 log.info("Closing provider for {}", APP_NAME);
218 rpcRegistration.close();
219 log.info("Successfully closed provider for {}", APP_NAME);
223 public void onDataTreeChanged(@Nonnull Collection changes) {
224 log.info("onDataTreeChanged() called. but there is no change here");
228 public ListenableFuture<RpcResult<ClusterHealthOutput>> clusterHealth(ClusterHealthInput input) {
229 log.info("{}:cluster-health invoked.", APP_NAME);
230 getControllerHealth();
231 return buildClusterHealthOutput("200");
235 public ListenableFuture<RpcResult<SiteHealthOutput>> siteHealth(SiteHealthInput input) {
236 log.info("{}:site-health invoked.", APP_NAME);
237 getControllerHealth();
238 return buildSiteHealthOutput("200", getAdminHealth(), getDatabaseHealth());
242 public ListenableFuture<RpcResult<DatabaseHealthOutput>> databaseHealth(DatabaseHealthInput input) {
243 log.info("{}:database-health invoked.", APP_NAME);
244 DatabaseHealthOutputBuilder outputBuilder = new DatabaseHealthOutputBuilder();
245 outputBuilder.setStatus("200");
246 outputBuilder.setHealth(getDatabaseHealth());
248 return Futures.immediateFuture(RpcResultBuilder.<DatabaseHealthOutput>status(true).withResult(outputBuilder.build()).build());
252 public ListenableFuture<RpcResult<AdminHealthOutput>> adminHealth(AdminHealthInput input) {
253 log.info("{}:admin-health invoked.", APP_NAME);
254 AdminHealthOutputBuilder outputBuilder = new AdminHealthOutputBuilder();
255 outputBuilder.setStatus("200");
256 outputBuilder.setHealth(getAdminHealth());
258 return Futures.immediateFuture(RpcResultBuilder.<AdminHealthOutput>status(true).withResult(outputBuilder.build()).build());
262 public ListenableFuture<RpcResult<HaltAkkaTrafficOutput>> haltAkkaTraffic(HaltAkkaTrafficInput input) {
263 log.info("{}:halt-akka-traffic invoked.", APP_NAME);
264 HaltAkkaTrafficOutputBuilder outputBuilder = new HaltAkkaTrafficOutputBuilder();
265 outputBuilder.setStatus("200");
266 modifyIpTables(IpTables.ADD, input.getNodeInfo().toArray());
268 return Futures.immediateFuture(RpcResultBuilder.<HaltAkkaTrafficOutput>status(true).withResult(outputBuilder.build()).build());
272 public ListenableFuture<RpcResult<ResumeAkkaTrafficOutput>> resumeAkkaTraffic(ResumeAkkaTrafficInput input) {
273 log.info("{}:resume-akka-traffic invoked.", APP_NAME);
274 ResumeAkkaTrafficOutputBuilder outputBuilder = new ResumeAkkaTrafficOutputBuilder();
275 outputBuilder.setStatus("200");
276 modifyIpTables(IpTables.DELETE, input.getNodeInfo().toArray());
278 return Futures.immediateFuture(RpcResultBuilder.<ResumeAkkaTrafficOutput>status(true).withResult(outputBuilder.build()).build());
282 public ListenableFuture<RpcResult<SiteIdentifierOutput>> siteIdentifier(SiteIdentifierInput input) {
283 log.info("{}:site-identifier invoked.", APP_NAME);
284 SiteIdentifierOutputBuilder outputBuilder = new SiteIdentifierOutputBuilder();
285 outputBuilder.setStatus("200");
286 outputBuilder.setId(siteIdentifier);
288 return Futures.immediateFuture(RpcResultBuilder.<SiteIdentifierOutput>status(true).withResult(outputBuilder.build()).build());
292 public ListenableFuture<RpcResult<FailoverOutput>> failover(FailoverInput input) {
293 log.info("{}:failover invoked.", APP_NAME);
294 FailoverOutputBuilder outputBuilder = new FailoverOutputBuilder();
295 if(siteConfiguration != SiteConfiguration.GEO) {
296 log.info("Cannot failover non-GEO site.");
297 outputBuilder.setMessage("Failover aborted. This is not a GEO configuration.");
298 outputBuilder.setStatus("400");
299 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
301 ArrayList<ClusterActor> activeSite = new ArrayList<>();
302 ArrayList<ClusterActor> standbySite = new ArrayList<>();
304 log.info("Performing preliminary cluster health check...");
305 // Necessary to populate all member info. Health is not used for judgement calls.
306 getControllerHealth();
308 log.info("Determining active site...");
309 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
310 String key = entry.getKey();
311 ClusterActor clusterActor = entry.getValue();
312 if(clusterActor.isVoting()) {
313 activeSite.add(clusterActor);
314 log.debug("Active Site member: {}", key);
317 standbySite.add(clusterActor);
318 log.debug("Standby Site member: {}", key);
322 String port = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL)) ? properties.getProperty(PropertyKeys.CONTROLLER_PORT_SSL) : properties.getProperty(PropertyKeys.CONTROLLER_PORT_HTTP);
324 if(Boolean.parseBoolean(input.getBackupData())) {
325 backupMdSal(activeSite, port);
328 if(!changeClusterVoting(outputBuilder, activeSite, standbySite, port))
329 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
331 if(Boolean.parseBoolean(input.getIsolate())) {
332 isolateSiteFromCluster(activeSite, standbySite, port);
334 if(Boolean.parseBoolean(input.getDownUnreachable())) {
335 downUnreachableNodes(activeSite, standbySite, port);
339 log.info("{}:failover complete.", APP_NAME);
341 outputBuilder.setMessage("Failover complete.");
342 outputBuilder.setStatus("200");
343 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
346 private void isolateSiteFromCluster(ArrayList<ClusterActor> activeSite, ArrayList<ClusterActor> standbySite, String port) {
347 log.info("Halting Akka traffic...");
348 for(ClusterActor actor : standbySite) {
350 log.info("Halting Akka traffic for: {}", actor.getNode());
351 // Build JSON with activeSite actor Node and actor AkkaPort
352 JSONObject akkaInput = new JSONObject();
353 JSONObject inputBlock = new JSONObject();
354 JSONArray votingStateArray = new JSONArray();
356 for(ClusterActor node : activeSite) {
357 nodeInfo = new JSONObject();
358 nodeInfo.put("node", node.getNode());
359 nodeInfo.put("port", node.getAkkaPort());
360 votingStateArray.put(nodeInfo);
362 inputBlock.put("node-info", votingStateArray);
363 akkaInput.put("input", inputBlock);
364 getRequestContent(httpProtocol + actor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:halt-akka-traffic", HttpMethod.POST, akkaInput.toString());
365 } catch(IOException e) {
366 log.error("Could not halt Akka traffic for: " + actor.getNode(), e);
371 private void downUnreachableNodes(ArrayList<ClusterActor> activeSite, ArrayList<ClusterActor> standbySite, String port) {
372 log.info("Setting site unreachable...");
373 JSONObject jolokiaInput = new JSONObject();
374 jolokiaInput.put("type", "EXEC");
375 jolokiaInput.put("mbean", "akka:type=Cluster");
376 jolokiaInput.put("operation", "down");
377 JSONArray arguments = new JSONArray();
378 for(ClusterActor actor : activeSite) {
379 // Build Jolokia input
380 // May need to change from akka port to actor.getAkkaPort()
381 arguments.put("akka.tcp://opendaylight-cluster-data@" + actor.getNode() + ":" + properties.getProperty(PropertyKeys.CONTROLLER_PORT_AKKA));
383 jolokiaInput.put("arguments", arguments);
384 log.debug("{}", jolokiaInput);
386 log.info("Setting nodes unreachable");
387 getRequestContent(httpProtocol + standbySite.get(0).getNode() + ":" + port + "/jolokia", HttpMethod.POST, jolokiaInput.toString());
388 } catch(IOException e) {
389 log.error("Error setting nodes unreachable", e);
393 private boolean changeClusterVoting(FailoverOutputBuilder outputBuilder, ArrayList<ClusterActor> activeSite, ArrayList<ClusterActor> standbySite, String port) {
394 log.info("Changing voting for all shards to standby site...");
396 JSONObject votingInput = new JSONObject();
397 JSONObject inputBlock = new JSONObject();
398 JSONArray votingStateArray = new JSONArray();
399 JSONObject memberVotingState;
400 for(ClusterActor actor : activeSite) {
401 memberVotingState = new JSONObject();
402 memberVotingState.put("member-name", actor.getMember());
403 memberVotingState.put("voting", false);
404 votingStateArray.put(memberVotingState);
406 for(ClusterActor actor : standbySite) {
407 memberVotingState = new JSONObject();
408 memberVotingState.put("member-name", actor.getMember());
409 memberVotingState.put("voting", true);
410 votingStateArray.put(memberVotingState);
412 inputBlock.put("member-voting-state", votingStateArray);
413 votingInput.put("input", inputBlock);
414 log.debug("{}", votingInput);
415 // Change voting all shards
416 getRequestContent(httpProtocol + self.getNode() + ":" + port + "/restconf/operations/cluster-admin:change-member-voting-states-for-all-shards", HttpMethod.POST, votingInput.toString());
417 } catch(IOException e) {
418 log.error("Changing voting", e);
419 outputBuilder.setMessage("Failover aborted. Failed to change voting.");
420 outputBuilder.setStatus("500");
426 private void backupMdSal(ArrayList<ClusterActor> activeSite, String port) {
427 log.info("Backing up data...");
429 log.info("Scheduling backup for: {}", activeSite.get(0).getNode());
430 getRequestContent(httpProtocol + activeSite.get(0).getNode() + ":" + port + "/restconf/operations/data-export-import:schedule-export", HttpMethod.POST, "{ \"input\": { \"run-at\": \"30\" } }");
431 } catch(IOException e) {
432 log.error("Error backing up MD-SAL", e);
434 for(ClusterActor actor : activeSite) {
437 log.info("Backing up data for: {}", actor.getNode());
438 getRequestContent(httpProtocol + actor.getNode() + ":" + port + "/restconf/operations/daexim-offsite-backup:backup-data", HttpMethod.POST);
439 } catch(IOException e) {
440 log.error("Error backing up data.", e);
445 private ListenableFuture<RpcResult<ClusterHealthOutput>> buildClusterHealthOutput(String statusCode) {
446 ClusterHealthOutputBuilder outputBuilder = new ClusterHealthOutputBuilder();
447 outputBuilder.setStatus(statusCode);
448 outputBuilder.setMembers((List) new ArrayList<Member>());
452 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
453 ClusterActor clusterActor = entry.getValue();
454 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
455 if(ClusterActor.SITE_1.equals(clusterActor.getSite()))
457 else if(ClusterActor.SITE_2.equals(clusterActor.getSite()))
460 outputBuilder.getMembers().add(new MemberBuilder(clusterActor).build());
462 if(siteConfiguration == SiteConfiguration.SOLO) {
463 outputBuilder.setSite1Health(HEALTHY);
465 else if(site1Health > 1) {
466 outputBuilder.setSite1Health(HEALTHY);
469 outputBuilder.setSite1Health(FAULTY);
472 if(siteConfiguration == SiteConfiguration.GEO && site2Health > 1) {
473 outputBuilder.setSite2Health(HEALTHY);
475 else if(siteConfiguration == SiteConfiguration.GEO) {
476 outputBuilder.setSite2Health(FAULTY);
479 RpcResult<ClusterHealthOutput> rpcResult = RpcResultBuilder.<ClusterHealthOutput>status(true).withResult(outputBuilder.build()).build();
480 return Futures.immediateFuture(rpcResult);
483 private ListenableFuture<RpcResult<SiteHealthOutput>> buildSiteHealthOutput(String statusCode, String adminHealth, String databaseHealth) {
484 SiteHealthOutputBuilder outputBuilder = new SiteHealthOutputBuilder();
485 outputBuilder.setStatus(statusCode);
486 outputBuilder.setSites((List) new ArrayList<Site>());
488 if(siteConfiguration != SiteConfiguration.GEO) {
490 SitesBuilder builder = new SitesBuilder();
491 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
492 ClusterActor clusterActor = entry.getValue();
493 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
497 if(siteConfiguration != SiteConfiguration.SOLO) {
498 builder.setHealth(HEALTHY);
499 builder.setRole("ACTIVE");
500 builder.setId(siteIdentifier);
503 builder = getSitesBuilder(healthyODLs, true, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), siteIdentifier);
505 outputBuilder.getSites().add(builder.build());
508 int site1HealthyODLs = 0;
509 int site2HealthyODLs = 0;
510 boolean site1Voting = false;
511 boolean site2Voting = false;
512 boolean performedCrossSiteHealthCheck = false;
513 boolean crossSiteAdminHealthy = false;
514 boolean crossSiteDbHealthy = false;
515 String crossSiteIdentifier = "UNKNOWN_SITE";
516 String port = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL)) ? properties.getProperty(PropertyKeys.CONTROLLER_PORT_SSL) : properties.getProperty(PropertyKeys.CONTROLLER_PORT_HTTP);
518 // Make calls over to site 2 healthchecks
519 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
520 ClusterActor clusterActor = entry.getValue();
521 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
522 if(ClusterActor.SITE_1.equals(clusterActor.getSite())) {
524 if(clusterActor.isVoting()) {
530 if(clusterActor.isVoting()) {
533 if(!performedCrossSiteHealthCheck) {
535 String content = getRequestContent(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:site-identifier", HttpMethod.POST);
536 crossSiteIdentifier = new JSONObject(content).getJSONObject("output").getString("id");
537 crossSiteDbHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:database-health");
538 crossSiteAdminHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:admin-health");
539 performedCrossSiteHealthCheck = true;
540 } catch(Exception e) {
541 log.info("Cannot get site identifier from {}", clusterActor.getNode());
542 log.error("Site Health Error", e);
548 SitesBuilder builder = getSitesBuilder(site1HealthyODLs, site1Voting, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), siteIdentifier);
549 outputBuilder.getSites().add(builder.build());
550 builder = getSitesBuilder(site2HealthyODLs, site2Voting, crossSiteAdminHealthy, crossSiteDbHealthy, crossSiteIdentifier);
551 outputBuilder.getSites().add(builder.build());
554 // Make calls over to site 1 healthchecks
555 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
556 ClusterActor clusterActor = entry.getValue();
557 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
558 if(ClusterActor.SITE_1.equals(clusterActor.getSite())) {
560 if(clusterActor.isVoting()) {
563 if(!performedCrossSiteHealthCheck) {
565 String content = getRequestContent(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:site-identifier", HttpMethod.POST);
566 crossSiteIdentifier = new JSONObject(content).getJSONObject("output").getString("id");
567 crossSiteDbHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:database-health");
568 crossSiteAdminHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:admin-health");
569 performedCrossSiteHealthCheck = true;
570 } catch(Exception e) {
571 log.info("Cannot get site identifier from {}", clusterActor.getNode());
572 log.error("Site Health Error", e);
578 if(clusterActor.isVoting()) {
585 SitesBuilder builder = getSitesBuilder(site1HealthyODLs, site1Voting, crossSiteAdminHealthy, crossSiteDbHealthy, crossSiteIdentifier);
586 outputBuilder.getSites().add(builder.build());
587 builder = getSitesBuilder(site2HealthyODLs, site2Voting, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), siteIdentifier);
588 outputBuilder.getSites().add(builder.build());
592 RpcResult<SiteHealthOutput> rpcResult = RpcResultBuilder.<SiteHealthOutput>status(true).withResult(outputBuilder.build()).build();
593 return Futures.immediateFuture(rpcResult);
596 private SitesBuilder getSitesBuilder(int siteHealthyODLs, boolean siteVoting, boolean adminHealthy, boolean dbHealthy, String siteIdentifier) {
597 SitesBuilder builder = new SitesBuilder();
598 if(siteHealthyODLs > 1) {
599 builder.setHealth(HEALTHY);
602 log.warn("{} Healthy ODLs: {}", siteIdentifier, siteHealthyODLs);
603 builder.setHealth(FAULTY);
606 log.warn("{} Admin Health: {}", siteIdentifier, FAULTY);
607 builder.setHealth(FAULTY);
610 log.warn("{} Database Health: {}", siteIdentifier, FAULTY);
611 builder.setHealth(FAULTY);
614 builder.setRole("ACTIVE");
617 builder.setRole("STANDBY");
619 builder.setId(siteIdentifier);
623 private boolean isSite1() {
624 int memberNumber = Integer.parseInt(member.split("-")[1]);
625 boolean isSite1 = memberNumber < 4;
626 log.info("isSite1(): {}", isSite1);
630 private void parseSeedNodes(String line) {
631 memberMap = new HashMap<>();
632 line = line.substring(line.indexOf("[\""), line.indexOf(']'));
633 String[] splits = line.split(",");
635 for(int ndx = 0; ndx < splits.length; ndx++) {
636 String nodeName = splits[ndx];
637 int delimLocation = nodeName.indexOf('@');
638 String port = nodeName.substring(splits[ndx].indexOf(':', delimLocation) + 1, splits[ndx].indexOf('"', splits[ndx].indexOf(':')));
639 splits[ndx] = nodeName.substring(delimLocation + 1, splits[ndx].indexOf(':', delimLocation));
640 log.info("Adding node: {}:{}", splits[ndx], port);
641 ClusterActor clusterActor = new ClusterActor();
642 clusterActor.setNode(splits[ndx]);
643 clusterActor.setAkkaPort(port);
644 clusterActor.setMember("member-" + (ndx + 1));
646 clusterActor.setSite(ClusterActor.SITE_1);
649 clusterActor.setSite(ClusterActor.SITE_2);
652 if(member.equals(clusterActor.getMember())) {
655 memberMap.put(clusterActor.getNode(), clusterActor);
656 log.info("{}", clusterActor);
659 if(memberMap.size() == 1) {
660 log.info("1 member found. This is a solo environment.");
661 siteConfiguration = SiteConfiguration.SOLO;
663 else if(memberMap.size() == 3) {
664 log.info("This is a single site.");
665 siteConfiguration = SiteConfiguration.SINGLE;
667 else if(memberMap.size() == 6) {
668 log.info("This is a georedundant site.");
669 siteConfiguration = SiteConfiguration.GEO;
673 private void getMemberStatus(ClusterActor clusterActor) throws IOException {
674 log.info("Getting member status for {}", clusterActor.getNode());
675 String content = getRequestContent(httpProtocol + clusterActor.getNode() + jolokiaClusterPath, HttpMethod.GET);
677 JSONObject responseJson = new JSONObject(content);
678 JSONObject responseValue = responseJson.getJSONObject(VALUE);
679 clusterActor.setUp("Up".equals(responseValue.getString("MemberStatus")));
680 clusterActor.setUnreachable(false);
681 } catch(JSONException e) {
682 log.error("Error parsing response from {}", clusterActor.getNode(), e);
683 clusterActor.setUp(false);
684 clusterActor.setUnreachable(true);
688 private void getShardStatus(ClusterActor clusterActor) throws IOException {
689 log.info("Getting shard status for {}", clusterActor.getNode());
690 String content = getRequestContent(httpProtocol + clusterActor.getNode() + shardManagerPath, HttpMethod.GET);
692 JSONObject responseValue = new JSONObject(content).getJSONObject(VALUE);
693 JSONArray shardList = responseValue.getJSONArray("LocalShards");
695 String pattern = "-config$";
696 Pattern r = Pattern.compile(pattern);
698 for(int ndx = 0; ndx < shardList.length(); ndx++) {
699 String configShardName = shardList.getString(ndx);
700 m = r.matcher(configShardName);
701 String operationalShardName = m.replaceFirst("-operational");
702 String shardConfigPath = String.format(shardPathTemplate, configShardName);
703 String shardOperationalPath = String.format(shardPathTemplate, operationalShardName).replace("Config", "Operational");
704 extractShardInfo(clusterActor, configShardName, shardConfigPath);
705 extractShardInfo(clusterActor, operationalShardName, shardOperationalPath);
707 } catch(JSONException e) {
708 log.error("Error parsing response from " + clusterActor.getNode(), e);
712 private void extractShardInfo(ClusterActor clusterActor, String shardName, String shardPath) throws IOException {
713 log.info("Extracting shard info for {}", shardName);
714 log.debug("Pulling config info for {} from: {}", shardName, shardPath);
715 String content = getRequestContent(httpProtocol + clusterActor.getNode() + shardPath, HttpMethod.GET);
716 log.debug("Response: {}", content);
719 JSONObject shardValue = new JSONObject(content).getJSONObject(VALUE);
720 clusterActor.setVoting(shardValue.getBoolean("Voting"));
721 if(shardValue.getString("PeerAddresses").length() > 0) {
722 clusterActor.getReplicaShards().add(shardName);
723 if(shardValue.getString("Leader").startsWith(clusterActor.getMember())) {
724 clusterActor.getShardLeader().add(shardName);
728 clusterActor.getNonReplicaShards().add(shardName);
730 JSONArray followerInfo = shardValue.getJSONArray("FollowerInfo");
731 for(int followerNdx = 0; followerNdx < followerInfo.length(); followerNdx++) {
732 int commitIndex = shardValue.getInt("CommitIndex");
733 int matchIndex = followerInfo.getJSONObject(followerNdx).getInt("matchIndex");
734 if(commitIndex != -1 && matchIndex != -1) {
735 int commitsBehind = commitIndex - matchIndex;
736 clusterActor.getCommits().put(followerInfo.getJSONObject(followerNdx).getString("id"), commitsBehind);
739 } catch(JSONException e) {
740 log.error("Error parsing response from " + clusterActor.getNode(), e);
744 private void getControllerHealth() {
745 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
746 ClusterActor clusterActor = entry.getValue();
747 String key = entry.getKey();
749 // First flush out the old values
750 clusterActor.flush();
751 log.info("Gathering info for {}", clusterActor.getNode());
752 getMemberStatus(clusterActor);
753 getShardStatus(clusterActor);
754 log.info("MemberInfo:\n{}", clusterActor);
755 } catch(IOException e) {
756 log.error("Connection Error", e);
757 memberMap.get(key).setUnreachable(true);
758 memberMap.get(key).setUp(false);
759 log.info("MemberInfo:\n{}", memberMap.get(key));
764 private void modifyIpTables(IpTables task, Object[] nodeInfo) {
765 log.info("Modifying IPTables rules...");
766 if(task == IpTables.ADD) {
767 for(Object node : nodeInfo) {
768 org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.halt.akka.traffic.input.NodeInfo n =
769 (org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.halt.akka.traffic.input.NodeInfo) node;
770 log.info("Isolating {}", n.getNode());
771 executeCommand(String.format("sudo /sbin/iptables -A INPUT -p tcp --destination-port %s -j DROP -s %s", properties.get(PropertyKeys.CONTROLLER_PORT_AKKA), n.getNode()));
772 executeCommand(String.format("sudo /sbin/iptables -A OUTPUT -p tcp --destination-port %s -j DROP -s %s", n.getPort(), n.getNode()));
775 } else if(task == IpTables.DELETE) {
776 for(Object node : nodeInfo) {
777 org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.resume.akka.traffic.input.NodeInfo n =
778 (org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.resume.akka.traffic.input.NodeInfo) node;
779 log.info("De-isolating {}", n.getNode());
780 executeCommand(String.format("sudo /sbin/iptables -D INPUT -p tcp --destination-port %s -j DROP -s %s", properties.get(PropertyKeys.CONTROLLER_PORT_AKKA), n.getNode()));
781 executeCommand(String.format("sudo /sbin/iptables -D OUTPUT -p tcp --destination-port %s -j DROP -s %s", n.getPort(), n.getNode()));
785 executeCommand("sudo /sbin/iptables -L");
788 private void executeCommand(String command) {
789 log.info("Executing command: {}", command);
790 String[] cmd = command.split(" ");
792 Process p = Runtime.getRuntime().exec(cmd);
793 BufferedReader bufferedReader = new BufferedReader(new InputStreamReader(p.getInputStream()));
795 StringBuilder content = new StringBuilder();
796 while((inputLine = bufferedReader.readLine()) != null) {
797 content.append(inputLine);
799 bufferedReader.close();
800 log.info("{}", content);
801 } catch(IOException e) {
802 log.error("Error executing command", e);
806 private boolean crossSiteHealthRequest(String path) throws IOException {
807 String content = getRequestContent(path, HttpMethod.POST);
809 JSONObject responseJson = new JSONObject(content);
810 JSONObject responseValue = responseJson.getJSONObject(VALUE);
811 return HEALTHY.equals(responseValue.getString("health"));
812 } catch(JSONException e) {
813 log.error("Error parsing JSON", e);
814 throw new IOException();
// Requests the ADM healthcheck endpoint with an HTTP GET and logs the status
// code that comes back. The URL is assembled entirely from the adm.* entries
// of `properties`.
818 private String getAdminHealth() {
// Only the exact string "true" selects SSL; a missing property or any other
// value falls back to plain http:// and the HTTP port.
819 String protocol = "true".equals(properties.getProperty(PropertyKeys.ADM_USE_SSL)) ? "https://" : "http://";
820 String port = "true".equals(properties.getProperty(PropertyKeys.ADM_USE_SSL)) ? properties.getProperty(PropertyKeys.ADM_PORT_SSL) : properties.getProperty(PropertyKeys.ADM_PORT_HTTP);
// URL layout: <protocol><fqdn>:<port><healthcheck>. No separator is inserted
// before the healthcheck value.
// NOTE(review): presumably the adm.healthcheck value starts with "/" - confirm.
821 String path = protocol + properties.getProperty(PropertyKeys.ADM_FQDN) + ":" + port + properties.getProperty(PropertyKeys.ADM_HEALTHCHECK);
822 log.info("Requesting healthcheck from {}", path);
// Only the HTTP status code is fetched; the response body is not read here.
824 int response = getRequestStatus(path, HttpMethod.GET);
825 log.info("Response: {}", response);
// A failed request is logged here rather than propagated as an IOException.
829 } catch(IOException e) {
830 log.error("Problem getting ADM health.", e);
// Checks the database through dbLib and logs the individual indicators
// (active, read-only, closed) before logging the overall verdict.
835 private String getDatabaseHealth() {
836 log.info("Determining database health...");
// NOTE(review): a Connection is obtained from dbLib here - confirm it is
// closed on every path, including the FAULTY branch and the SQLException path.
838 Connection connection = dbLib.getConnection();
839 log.info("DBLib isActive(): {}", dbLib.isActive());
840 log.info("DBLib isReadOnly(): {}", connection.isReadOnly());
841 log.info("DBLib isClosed(): {}", connection.isClosed());
// Any one of: dbLib inactive, connection closed, or connection read-only is
// enough to log the database as FAULTY.
842 if(!dbLib.isActive() || connection.isClosed() || connection.isReadOnly()) {
843 log.warn("Database is FAULTY");
848 log.info("Database is HEALTHY");
// A SQLException raised by any of the calls above is also logged as FAULTY;
// the exception itself is logged on the second line.
849 } catch(SQLException e) {
850 log.error("Database is FAULTY");
851 log.error("Error", e);
858 private String getRequestContent(String path, HttpMethod method) throws IOException {
859 return getRequestContent(path, method, null);
862 private String getRequestContent(String path, HttpMethod method, String input) throws IOException {
863 HttpURLConnection connection = getConnection(path);
864 connection.setRequestMethod(method.getMethod());
865 connection.setDoInput(true);
868 sendPayload(input, connection);
871 BufferedReader bufferedReader = new BufferedReader(new InputStreamReader(connection.getInputStream()));
873 StringBuilder content = new StringBuilder();
874 while((inputLine = bufferedReader.readLine()) != null) {
875 content.append(inputLine);
877 bufferedReader.close();
878 connection.disconnect();
879 return content.toString();
882 private int getRequestStatus(String path, HttpMethod method) throws IOException {
883 return getRequestStatus(path, method, null);
886 private int getRequestStatus(String path, HttpMethod method, String input) throws IOException {
887 HttpURLConnection connection = getConnection(path);
888 connection.setRequestMethod(method.getMethod());
889 connection.setDoInput(true);
892 sendPayload(input, connection);
894 int response = connection.getResponseCode();
895 log.info("Received {} response code from {}", response, path);
896 connection.disconnect();
900 private void sendPayload(String input, HttpURLConnection connection) throws IOException {
901 byte[] out = input.getBytes(StandardCharsets.UTF_8);
902 int length = out.length;
904 connection.setFixedLengthStreamingMode(length);
905 connection.setRequestProperty("Content-Type", "application/json");
906 connection.setDoOutput(true);
907 connection.connect();
908 try(OutputStream os = connection.getOutputStream()) {
913 private HttpURLConnection getConnection(String host) throws IOException {
914 log.info("Getting connection to: {}", host);
915 URL url = new URL(host);
916 String auth = "Basic " + javax.xml.bind.DatatypeConverter.printBase64Binary(credentials.getBytes());
917 HttpURLConnection connection = (HttpURLConnection) url.openConnection();
918 connection.addRequestProperty("Authorization", auth);
919 connection.setRequestProperty("Connection", "keep-alive");
920 connection.setRequestProperty("Proxy-Connection", "keep-alive");
929 enum SiteConfiguration {
// Verb string supplied to the constructor for each constant.
939 private String method;
// Stores the verb string given for this constant.
940 HttpMethod(String method) {
941 this.method = method;
// Accessor the request helpers call as method.getMethod() when they invoke
// HttpURLConnection.setRequestMethod(...).
943 public String getMethod() {
// Key names used with the provider's `properties` object (referenced elsewhere
// in this file as PropertyKeys.<NAME>).
// NOTE(review): the enclosing declaration is not visible here; confirm these
// belong to PropertyKeys.
949 static final String SITE_IDENTIFIER = "site.identifier";
// controller.* keys. CONTROLLER_PORT_AKKA supplies the --destination-port of
// the INPUT rules built in modifyIpTables.
950 static final String CONTROLLER_USE_SSL = "controller.useSsl";
951 static final String CONTROLLER_PORT_SSL = "controller.port.ssl";
952 static final String CONTROLLER_PORT_HTTP = "controller.port.http";
953 static final String CONTROLLER_PORT_AKKA = "controller.port.akka";
954 static final String CONTROLLER_CREDENTIALS = "controller.credentials";
955 static final String AKKA_CONF_LOCATION = "akka.conf.location";
// mbean.* keys.
956 static final String MBEAN_CLUSTER = "mbean.cluster";
957 static final String MBEAN_SHARD_MANAGER = "mbean.shardManager";
958 static final String MBEAN_SHARD_CONFIG = "mbean.shard.config";
// adm.* keys: getAdminHealth combines these into the ADM healthcheck URL
// (<http|https>://<fqdn>:<port><healthcheck>).
959 static final String ADM_USE_SSL = "adm.useSsl";
960 static final String ADM_PORT_SSL = "adm.port.ssl";
961 static final String ADM_PORT_HTTP = "adm.port.http";
962 static final String ADM_FQDN = "adm.fqdn";
963 static final String ADM_HEALTHCHECK= "adm.healthcheck";