2 * ============LICENSE_START=======================================================
4 * ================================================================================
5 * Copyright (C) 2018 AT&T Intellectual Property. All rights
7 * ================================================================================
8 * Licensed under the Apache License, Version 2.0 (the "License");
9 * you may not use this file except in compliance with the License.
10 * You may obtain a copy of the License at
12 * http://www.apache.org/licenses/LICENSE-2.0
14 * Unless required by applicable law or agreed to in writing, software
15 * distributed under the License is distributed on an "AS IS" BASIS,
16 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17 * See the License for the specific language governing permissions and
18 * limitations under the License.
19 * ============LICENSE_END=========================================================
22 package org.onap.ccsdk.sli.plugins;
24 import java.io.BufferedReader;
26 import java.io.FileInputStream;
27 import java.io.FileReader;
28 import java.io.IOException;
29 import java.io.InputStreamReader;
30 import java.io.OutputStream;
31 import java.net.HttpURLConnection;
33 import java.nio.charset.StandardCharsets;
34 import java.sql.SQLException;
35 import java.util.ArrayList;
36 import java.util.Collection;
37 import java.util.HashMap;
38 import java.util.Properties;
39 import java.util.List;
40 import java.util.concurrent.ExecutionException;
41 import java.util.concurrent.ExecutorService;
42 import java.util.concurrent.Executors;
43 import java.util.regex.Matcher;
44 import java.util.regex.Pattern;
45 import javax.annotation.Nonnull;
47 import com.google.common.util.concurrent.CheckedFuture;
48 import com.google.common.util.concurrent.Futures;
49 import com.google.common.util.concurrent.ListenableFuture;
51 import org.onap.ccsdk.sli.core.dblib.DbLibService;
52 import org.onap.ccsdk.sli.plugins.data.ClusterActor;
53 import org.onap.ccsdk.sli.plugins.data.MemberBuilder;
55 import org.json.JSONArray;
56 import org.json.JSONException;
57 import org.json.JSONObject;
59 import org.opendaylight.controller.cluster.datastore.DistributedDataStoreInterface;
60 import org.opendaylight.controller.md.sal.binding.api.DataBroker;
61 import org.opendaylight.controller.md.sal.binding.api.DataTreeChangeListener;
62 import org.opendaylight.controller.md.sal.binding.api.NotificationPublishService;
63 import org.opendaylight.controller.md.sal.binding.api.WriteTransaction;
64 import org.opendaylight.controller.md.sal.common.api.data.TransactionCommitFailedException;
65 import org.opendaylight.controller.sal.binding.api.BindingAwareBroker;
66 import org.opendaylight.controller.sal.binding.api.RpcProviderRegistry;
67 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthInput;
68 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthOutput;
69 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthOutputBuilder;
70 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthInput;
71 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthOutput;
72 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthOutputBuilder;
73 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthInput;
74 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthOutput;
75 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthOutputBuilder;
76 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverInput;
77 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverOutput;
78 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverOutputBuilder;
79 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.GrToolkitService;
80 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficInput;
81 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficOutput;
82 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficOutputBuilder;
83 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.Member;
84 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficInput;
85 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficOutput;
86 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficOutputBuilder;
87 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.Site;
88 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthInput;
89 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthOutput;
90 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthOutputBuilder;
91 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierInput;
92 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierOutput;
93 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierOutputBuilder;
94 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.site.health.output.SitesBuilder;
95 import org.opendaylight.yangtools.yang.common.RpcResult;
96 import org.opendaylight.yangtools.yang.common.RpcResultBuilder;
98 import org.slf4j.Logger;
99 import org.slf4j.LoggerFactory;
101 public class GrToolkitProvider implements AutoCloseable, GrToolkitService, DataTreeChangeListener {
// Location of the toolkit properties file, built from the SDNC_CONFIG_DIR environment variable.
102 private static final String PROPERTIES_FILE = System.getenv("SDNC_CONFIG_DIR") + "/gr-toolkit.properties";
// Health labels written into RPC outputs and compared against admin/database health results.
103 private static final String HEALTHY = "HEALTHY";
104 private static final String FAULTY = "FAULTY";
// The six values below are assigned by setProperties() from the loaded properties file.
// Path of the akka.conf file that defineMembers() parses.
105 private static String AKKA_CONFIG;
// ":" + controller port + the configured mbean path; appended to a node host when building request URLs.
106 private static String JOLOKIA_CLUSTER_PATH;
107 private static String SHARD_MANAGER_PATH;
// Used as a String.format template taking a shard name (see getShardStatus()).
108 private static String SHARD_PATH_TEMPLATE;
109 private static String CREDENTIALS;
// "https://" or "http://", chosen from the controller.useSsl property.
110 private static String HTTP_PROTOCOL;
// Taken from the SITE_NAME environment variable; setProperties() falls back to the
// "site.identifier" property when this is null or empty.
111 private static String SITE_IDENTIFIER = System.getenv("SITE_NAME");
112 private final Logger log = LoggerFactory.getLogger(GrToolkitProvider.class);
113 private final String appName = "gr-toolkit";
// Fixed pool of one thread, created in the constructor.
114 private final ExecutorService executor;
// Collaborators injected through the constructor.
115 protected DataBroker dataBroker;
116 protected NotificationPublishService notificationService;
117 protected RpcProviderRegistry rpcRegistry;
// Set by initialize() when this provider is registered as the GrToolkitService implementation.
118 protected BindingAwareBroker.RpcRegistration<GrToolkitService> rpcRegistration;
119 protected DbLibService dbLib;
// Name of the current cluster member, read from the config datastore in defineMembers().
120 private String member;
// NOTE(review): presumably the ClusterActor describing this node; its assignment is not visible in this listing.
121 private ClusterActor self;
// Cluster members keyed by node host; rebuilt by parseSeedNodes().
122 private HashMap<String, ClusterActor> members;
// Solo, Single or Geo, chosen by parseSeedNodes() from the number of seed nodes.
123 private SiteConfiguration siteConfiguration;
// Contents of PROPERTIES_FILE, loaded by setProperties().
124 private Properties properties;
125 private DistributedDataStoreInterface configDatastore;
/**
 * Creates the provider, stores the injected collaborators and allocates the
 * single-thread executor. No registration or file access happens here.
 *
 * @param dataBroker                  broker used to open datastore transactions
 * @param notificationProviderService service kept in {@code notificationService}
 * @param rpcProviderRegistry         registry used later to register the RPC implementation
 * @param configDatastore             config datastore used to look up the current member name
 * @param dbLibService                database library service kept in {@code dbLib}
 */
public GrToolkitProvider(DataBroker dataBroker,
                         NotificationPublishService notificationProviderService,
                         RpcProviderRegistry rpcProviderRegistry,
                         DistributedDataStoreInterface configDatastore,
                         DbLibService dbLibService) {
    this.log.info("Creating provider for " + appName);

    // Injected collaborators.
    this.dbLib = dbLibService;
    this.configDatastore = configDatastore;
    this.rpcRegistry = rpcProviderRegistry;
    this.notificationService = notificationProviderService;
    this.dataBroker = dataBroker;

    // Locally owned resources.
    this.executor = Executors.newFixedThreadPool(1);
}
// Starts the provider: logs start-up, asks GrToolkitUtil to load its properties and registers this
// instance as the GrToolkitService RPC implementation.
141 public void initialize() {
142 log.info("Initializing provider for " + appName);
143 // Create the top level containers
// NOTE(review): the statements between the comment above and the loadProperties() call, including the
// `try {` that the catch below belongs to, are not visible in this listing.
146 GrToolkitUtil.loadProperties();
147 } catch (Exception e) {
// A failure while loading the properties is only logged here.
148 log.error("Caught Exception while trying to load properties file.", e);
// NOTE(review): original lines 149-153 are not visible here; presumably they close the catch block and
// perform further set-up before registration -- confirm against the full file.
// Keep the registration handle so close() can release it.
154 rpcRegistration = rpcRegistry.addRpcImplementation(GrToolkitService.class, this);
155 log.info("Initialization complete for " + appName);
158 private void setProperties() {
159 log.info("Loading properties from " + PROPERTIES_FILE);
160 properties = new Properties();
161 File propertiesFile = new File(PROPERTIES_FILE);
162 if(!propertiesFile.exists()) {
163 log.warn("Properties file not found.");
166 try(FileInputStream fileInputStream = new FileInputStream(propertiesFile)) {
167 properties.load(fileInputStream);
168 if(!properties.containsKey("site.identifier")) {
169 properties.put("site.identifier", "Unknown Site");
171 String port = "true".equals(properties.getProperty("controller.useSsl").trim()) ? properties.getProperty("controller.port.ssl").trim() : properties.getProperty("controller.port.http").trim();
172 HTTP_PROTOCOL = "true".equals(properties.getProperty("controller.useSsl").trim()) ? "https://" : "http://";
173 AKKA_CONFIG = properties.getProperty("akka.conf.location").trim();
174 JOLOKIA_CLUSTER_PATH = ":" + port + properties.getProperty("mbean.cluster").trim();
175 SHARD_MANAGER_PATH = ":" + port + properties.getProperty("mbean.shardManager").trim();
176 SHARD_PATH_TEMPLATE = ":" + port + properties.getProperty("mbean.shard.config").trim();
177 if(SITE_IDENTIFIER == null || SITE_IDENTIFIER.isEmpty()) {
178 SITE_IDENTIFIER = properties.getProperty("site.identifier").trim();
180 CREDENTIALS = properties.getProperty("controller.credentials").trim();
181 log.info("Loaded properties.");
182 } catch(IOException e) {
183 log.error("Error loading properties.", e);
187 private void defineMembers() {
188 member = configDatastore.getActorContext().getCurrentMemberName().getName();
189 log.info("Cluster member: " + member);
191 log.info("Parsing akka.conf for cluster members...");
193 File akkaConfig = new File(AKKA_CONFIG);
194 FileReader fileReader = new FileReader(akkaConfig);
195 BufferedReader bufferedReader = new BufferedReader(fileReader);
197 while((line = bufferedReader.readLine()) != null) {
198 if(line.contains("seed-nodes =")) {
199 parseSeedNodes(line);
203 bufferedReader.close();
205 } catch(IOException e) {
206 log.error("Couldn't load akka", e);
208 log.info("self:\n{}", self.toString());
211 private void createContainers() {
212 final WriteTransaction t = dataBroker.newReadWriteTransaction();
214 CheckedFuture<Void, TransactionCommitFailedException>checkedFuture = t.submit();
216 log.info("Create Containers succeeded!");
217 } catch (InterruptedException | ExecutionException e) {
218 log.error("Create Containers Failed: " + e);
219 log.error("context", e);
223 protected void initializeChild() {
224 // Override if you have custom initialization intelligence
228 public void close() throws Exception {
229 log.info("Closing provider for " + appName);
231 rpcRegistration.close();
232 log.info("Successfully closed provider for " + appName);
236 public void onDataTreeChanged(@Nonnull Collection changes) {
237 log.info("onDataTreeChanged() called. but there is no change here");
241 public ListenableFuture<RpcResult<ClusterHealthOutput>> clusterHealth(ClusterHealthInput input) {
242 log.info(appName + ":cluster-health invoked.");
243 getControllerHealth();
244 return buildClusterHealthOutput("200");
248 public ListenableFuture<RpcResult<SiteHealthOutput>> siteHealth(SiteHealthInput input) {
249 log.info(appName + ":site-health invoked.");
250 getControllerHealth();
251 return buildSiteHealthOutput("200", getAdminHealth(), getDatabaseHealth());
255 public ListenableFuture<RpcResult<DatabaseHealthOutput>> databaseHealth(DatabaseHealthInput input) {
256 log.info(appName + ":database-health invoked.");
257 DatabaseHealthOutputBuilder outputBuilder = new DatabaseHealthOutputBuilder();
258 outputBuilder.setStatus("200");
259 outputBuilder.setHealth(getDatabaseHealth());
261 return Futures.immediateFuture(RpcResultBuilder.<DatabaseHealthOutput>status(true).withResult(outputBuilder.build()).build());
265 public ListenableFuture<RpcResult<AdminHealthOutput>> adminHealth(AdminHealthInput input) {
266 log.info(appName + ":admin-health invoked.");
267 AdminHealthOutputBuilder outputBuilder = new AdminHealthOutputBuilder();
268 outputBuilder.setStatus("200");
269 outputBuilder.setHealth(getAdminHealth());
271 return Futures.immediateFuture(RpcResultBuilder.<AdminHealthOutput>status(true).withResult(outputBuilder.build()).build());
275 public ListenableFuture<RpcResult<HaltAkkaTrafficOutput>> haltAkkaTraffic(HaltAkkaTrafficInput input) {
276 log.info(appName + ":halt-akka-traffic invoked.");
277 HaltAkkaTrafficOutputBuilder outputBuilder = new HaltAkkaTrafficOutputBuilder();
278 outputBuilder.setStatus("200");
279 modifyIpTables(IpTables.Add, input.getNodeInfo().toArray());
281 return Futures.immediateFuture(RpcResultBuilder.<HaltAkkaTrafficOutput>status(true).withResult(outputBuilder.build()).build());
285 public ListenableFuture<RpcResult<ResumeAkkaTrafficOutput>> resumeAkkaTraffic(ResumeAkkaTrafficInput input) {
286 log.info(appName + ":resume-akka-traffic invoked.");
287 ResumeAkkaTrafficOutputBuilder outputBuilder = new ResumeAkkaTrafficOutputBuilder();
288 outputBuilder.setStatus("200");
289 modifyIpTables(IpTables.Delete, input.getNodeInfo().toArray());
291 return Futures.immediateFuture(RpcResultBuilder.<ResumeAkkaTrafficOutput>status(true).withResult(outputBuilder.build()).build());
295 public ListenableFuture<RpcResult<SiteIdentifierOutput>> siteIdentifier(SiteIdentifierInput input) {
296 log.info(appName + ":site-identifier invoked.");
297 SiteIdentifierOutputBuilder outputBuilder = new SiteIdentifierOutputBuilder();
298 outputBuilder.setStatus("200");
299 outputBuilder.setId(SITE_IDENTIFIER);
301 return Futures.immediateFuture(RpcResultBuilder.<SiteIdentifierOutput>status(true).withResult(outputBuilder.build()).build());
305 public ListenableFuture<RpcResult<FailoverOutput>> failover(FailoverInput input) {
306 log.info(appName + ":failover invoked.");
307 FailoverOutputBuilder outputBuilder = new FailoverOutputBuilder();
308 if(siteConfiguration != SiteConfiguration.Geo) {
309 log.info("Cannot failover non-Geo site.");
310 outputBuilder.setMessage("Failover aborted. This is not a Geo configuration.");
311 outputBuilder.setStatus("400");
312 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
314 ArrayList<ClusterActor> activeSite = new ArrayList<>();
315 ArrayList<ClusterActor> standbySite = new ArrayList<>();
317 log.info("Performing preliminary cluster health check...");
318 // Necessary to populate all member info. Health is not used for judgement calls.
319 getControllerHealth();
321 log.info("Determining active site...");
322 for(String key : members.keySet()) {
323 if(members.get(key).isVoting()) {
324 activeSite.add(members.get(key));
325 log.debug("Active Site member: " + key);
328 standbySite.add(members.get(key));
329 log.debug("Standby Site member: " + key);
333 String port = "true".equals(properties.getProperty("controller.useSsl")) ? properties.getProperty("controller.port.ssl") : properties.getProperty("controller.port.http");
335 if(Boolean.parseBoolean(input.getBackupData())) {
336 log.info("Backing up data...");
337 for(ClusterActor actor : activeSite) {
340 log.info("Scheduling backup for: " + actor.getNode());
341 getRequestContent(HTTP_PROTOCOL + actor.getNode() + ":" + port + "/restconf/operations/data-export-import:schedule-export", HttpMethod.Post, "");
344 log.info("Backing up data for: " + actor.getNode());
345 getRequestContent(HTTP_PROTOCOL + actor.getNode() + ":" + port + "/restconf/operations/daexim-offsite-backup:backup-data", HttpMethod.Post);
346 } catch(IOException e) {
347 log.error("Error backing up data.", e);
351 catch(IOException e) {
352 log.error("Error exporting MD-SAL data.", e);
357 log.info("Changing voting for all shards to standby site...");
359 JSONObject votingInput = new JSONObject();
360 JSONObject inputBlock = new JSONObject();
361 JSONArray votingStateArray = new JSONArray();
362 JSONObject memberVotingState;
363 for(ClusterActor actor : activeSite) {
364 memberVotingState = new JSONObject();
365 memberVotingState.put("member-name", actor.getMember());
366 memberVotingState.put("voting", false);
367 votingStateArray.put(memberVotingState);
369 for(ClusterActor actor : standbySite) {
370 memberVotingState = new JSONObject();
371 memberVotingState.put("member-name", actor.getMember());
372 memberVotingState.put("voting", true);
373 votingStateArray.put(memberVotingState);
375 inputBlock.put("member-voting-state", votingStateArray);
376 votingInput.put("input", inputBlock);
377 log.debug(votingInput.toString(2));
378 // Change voting all shards
379 getRequestContent(HTTP_PROTOCOL + self.getNode() + ":" + port + "/restconf/operations/cluster-admin:change-member-voting-states-for-all-shards", HttpMethod.Post, votingInput.toString());
380 } catch(IOException e) {
381 log.error("Changing voting", e);
382 outputBuilder.setMessage("Failover aborted. Failed to change voting.");
383 outputBuilder.setStatus("500");
384 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
388 log.info("Halting Akka traffic...");
389 for(ClusterActor actor : standbySite) {
391 log.info("Halting Akka traffic for: " + actor.getNode());
392 // Build JSON with activeSite actor.getNode() and actor.getAkkaPort();
393 JSONObject akkaInput = new JSONObject();
394 JSONObject inputBlock = new JSONObject();
395 JSONArray votingStateArray = new JSONArray();
397 for(ClusterActor node : activeSite) {
398 nodeInfo = new JSONObject();
399 nodeInfo.put("node", node.getNode());
400 nodeInfo.put("port", node.getAkkaPort());
401 votingStateArray.put(nodeInfo);
403 inputBlock.put("node-info", votingStateArray);
404 akkaInput.put("input", inputBlock);
405 getRequestContent(HTTP_PROTOCOL + actor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:halt-akka-traffic", HttpMethod.Post, akkaInput.toString());
406 } catch(IOException e) {
407 log.error("Could not halt Akka traffic for: " + actor.getNode(), e);
412 log.info("Setting site unreachable...");
413 JSONObject jolokiaInput = new JSONObject();
414 jolokiaInput.put("type", "EXEC");
415 jolokiaInput.put("mbean", "akka:type=Cluster");
416 jolokiaInput.put("operation", "down");
417 JSONArray arguments = new JSONArray();
418 for(ClusterActor actor : activeSite) {
419 // Build Jolokia input
420 //TODO: May need to change from akka port to actor.getAkkaPort()
421 arguments.put("akka.tcp://opendaylight-cluster-data@" + actor.getNode() + ":" + properties.getProperty("controller.port.akka"));
423 jolokiaInput.put("arguments", arguments);
424 log.debug(jolokiaInput.toString(2));
426 log.info("Setting nodes unreachable");
427 getRequestContent(HTTP_PROTOCOL + standbySite.get(0).getNode() + ":" + port + "/jolokia", HttpMethod.Post, jolokiaInput.toString());
428 } catch(IOException e) {
429 log.error("Error setting nodes unreachable", e);
432 log.info(appName + ":failover complete.");
434 outputBuilder.setMessage("Failover complete.");
435 outputBuilder.setStatus("200");
436 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
439 private ListenableFuture<RpcResult<ClusterHealthOutput>> buildClusterHealthOutput(String statusCode) {
440 ClusterHealthOutputBuilder outputBuilder = new ClusterHealthOutputBuilder();
441 outputBuilder.setStatus(statusCode);
442 outputBuilder.setMembers((List) new ArrayList<Member>());
446 for(String key : members.keySet()) {
447 if(members.get(key).isUp() && !members.get(key).isUnreachable()) {
448 if(ClusterActor.SITE_1.equals(members.get(key).getSite()))
450 else if(ClusterActor.SITE_2.equals(members.get(key).getSite()))
453 outputBuilder.getMembers().add(new MemberBuilder(members.get(key)).build());
455 if(siteConfiguration == SiteConfiguration.Solo) {
456 outputBuilder.setSite1Health(HEALTHY);
459 if(site1Health > 1) {
460 outputBuilder.setSite1Health(HEALTHY);
463 outputBuilder.setSite1Health(FAULTY);
466 if(siteConfiguration == SiteConfiguration.Geo) {
467 if(site2Health > 1) {
468 outputBuilder.setSite2Health(HEALTHY);
471 outputBuilder.setSite2Health(FAULTY);
475 RpcResult<ClusterHealthOutput> rpcResult = RpcResultBuilder.<ClusterHealthOutput>status(true).withResult(outputBuilder.build()).build();
476 return Futures.immediateFuture(rpcResult);
479 private ListenableFuture<RpcResult<SiteHealthOutput>> buildSiteHealthOutput(String statusCode, String adminHealth, String databaseHealth) {
480 SiteHealthOutputBuilder outputBuilder = new SiteHealthOutputBuilder();
481 outputBuilder.setStatus(statusCode);
482 outputBuilder.setSites((List) new ArrayList<Site>());
484 if(siteConfiguration != SiteConfiguration.Geo) {
486 SitesBuilder builder = new SitesBuilder();
487 for(String key : members.keySet()) {
488 if(members.get(key).isUp() && !members.get(key).isUnreachable()) {
492 if(siteConfiguration != SiteConfiguration.Solo) {
493 builder.setHealth(HEALTHY);
494 builder.setRole("ACTIVE");
495 builder.setId(SITE_IDENTIFIER);
498 builder = getSitesBuilder(healthyODLs, true, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), SITE_IDENTIFIER);
500 outputBuilder.getSites().add(builder.build());
503 int site1HealthyODLs = 0;
504 int site2HealthyODLs = 0;
505 boolean site1Voting = false;
506 boolean site2Voting = false;
507 boolean performedCrossSiteHealthCheck = false;
508 boolean crossSiteAdminHealthy = false;
509 boolean crossSiteDbHealthy = false;
510 String crossSiteIdentifier = "UNKNOWN_SITE";
511 String port = "true".equals(properties.getProperty("controller.useSsl")) ? properties.getProperty("controller.port.ssl") : properties.getProperty("controller.port.http");
513 // Make calls over to site 2 healthchecks
514 for(String key : members.keySet()) {
515 if(members.get(key).isUp() && !members.get(key).isUnreachable()) {
516 if(ClusterActor.SITE_1.equals(members.get(key).getSite())) {
518 if(members.get(key).isVoting()) {
524 if(members.get(key).isVoting()) {
527 if(!performedCrossSiteHealthCheck) {
529 String content = getRequestContent(HTTP_PROTOCOL + members.get(key).getNode() + ":" + port + "/restconf/operations/gr-toolkit:site-identifier", HttpMethod.Post);
530 crossSiteIdentifier = new JSONObject(content).getJSONObject("output").getString("id");
531 crossSiteDbHealthy = crossSiteHealthRequest(HTTP_PROTOCOL + members.get(key).getNode() + ":" + port + "/restconf/operations/gr-toolkit:database-health");
532 crossSiteAdminHealthy = crossSiteHealthRequest(HTTP_PROTOCOL + members.get(key).getNode() + ":" + port + "/restconf/operations/gr-toolkit:admin-health");
533 performedCrossSiteHealthCheck = true;
534 } catch(Exception e) {
535 log.error("Cannot get site identifier from " + members.get(key).getNode(), e);
541 SitesBuilder builder = getSitesBuilder(site1HealthyODLs, site1Voting, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), SITE_IDENTIFIER);
542 outputBuilder.getSites().add(builder.build());
543 builder = getSitesBuilder(site2HealthyODLs, site2Voting, crossSiteAdminHealthy, crossSiteDbHealthy, crossSiteIdentifier);
544 outputBuilder.getSites().add(builder.build());
547 // Make calls over to site 1 healthchecks
548 for(String key : members.keySet()) {
549 if(members.get(key).isUp() && !members.get(key).isUnreachable()) {
550 if(ClusterActor.SITE_1.equals(members.get(key).getSite())) {
552 if(members.get(key).isVoting()) {
555 if(!performedCrossSiteHealthCheck) {
557 String content = getRequestContent(HTTP_PROTOCOL + members.get(key).getNode() + ":" + port + "/restconf/operations/gr-toolkit:site-identifier", HttpMethod.Post);
558 crossSiteIdentifier = new JSONObject(content).getJSONObject("output").getString("id");
559 crossSiteDbHealthy = crossSiteHealthRequest(HTTP_PROTOCOL + members.get(key).getNode() + ":" + port + "/restconf/operations/gr-toolkit:database-health");
560 crossSiteAdminHealthy = crossSiteHealthRequest(HTTP_PROTOCOL + members.get(key).getNode() + ":" + port + "/restconf/operations/gr-toolkit:admin-health");
561 performedCrossSiteHealthCheck = true;
562 } catch(Exception e) {
563 log.error("Cannot get site identifier from " + members.get(key).getNode(), e);
569 if(members.get(key).isVoting()) {
576 SitesBuilder builder = getSitesBuilder(site1HealthyODLs, site1Voting, crossSiteAdminHealthy, crossSiteDbHealthy, crossSiteIdentifier);
577 outputBuilder.getSites().add(builder.build());
578 builder = getSitesBuilder(site2HealthyODLs, site2Voting, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), SITE_IDENTIFIER);
579 outputBuilder.getSites().add(builder.build());
583 RpcResult<SiteHealthOutput> rpcResult = RpcResultBuilder.<SiteHealthOutput>status(true).withResult(outputBuilder.build()).build();
584 return Futures.immediateFuture(rpcResult);
587 private SitesBuilder getSitesBuilder(int siteHealthyODLs, boolean siteVoting, boolean adminHealthy, boolean dbHealthy, String siteIdentifier) {
588 SitesBuilder builder = new SitesBuilder();
589 if(siteHealthyODLs > 1) {
590 builder.setHealth(HEALTHY);
593 log.warn(siteIdentifier + " Healthy ODLs: " + siteHealthyODLs);
594 builder.setHealth(FAULTY);
597 log.warn(siteIdentifier + " Admin Health: " + FAULTY);
598 builder.setHealth(FAULTY);
601 log.warn(siteIdentifier + " Database Health: " + FAULTY);
602 builder.setHealth(FAULTY);
605 builder.setRole("ACTIVE");
608 builder.setRole("STANDBY");
610 builder.setId(siteIdentifier);
614 private boolean isSite1() {
615 int memberNumber = Integer.parseInt(member.split("-")[1]);
616 boolean isSite1 = memberNumber < 4;
617 log.info("isSite1(): " + isSite1);
// Parses the akka.conf "seed-nodes" line: creates one ClusterActor per listed node, stores the actors in
// `members` keyed by node host, and sets `siteConfiguration` from the number of members found.
621 private void parseSeedNodes(String line) {
// Any previously parsed members are discarded.
622 members = new HashMap<>();
// Keep the text from the first `["` up to, but not including, the first `]`.
623 line = line.substring(line.indexOf("[\""), line.indexOf("]"));
624 String[] splits = line.split(",");
626 for(int ndx = 0; ndx < splits.length; ndx++) {
627 String nodeName = splits[ndx];
628 int delimLocation = nodeName.indexOf("@");
// Port: the text after the first ':' that follows '@', up to the first '"' found after the entry's first ':'.
629 String port = nodeName.substring(splits[ndx].indexOf(":", delimLocation) + 1, splits[ndx].indexOf("\"", splits[ndx].indexOf(":")));
// Host: the text between '@' and the ':' that follows it; the array slot is overwritten with the host.
630 splits[ndx] = nodeName.substring(delimLocation + 1, splits[ndx].indexOf(":", delimLocation));
631 log.info("Adding node: " + splits[ndx] + ":" + port);
632 ClusterActor clusterActor = new ClusterActor();
633 clusterActor.setNode(splits[ndx]);
634 clusterActor.setAkkaPort(port);
// Member names are assigned by position in the seed-node list, starting at member-1.
635 clusterActor.setMember("member-" + (ndx + 1));
// NOTE(review): the condition choosing between SITE_1 and SITE_2 is not visible in this listing.
637 clusterActor.setSite(ClusterActor.SITE_1);
640 clusterActor.setSite(ClusterActor.SITE_2);
// NOTE(review): the statement executed when this entry is the current member is not visible in this
// listing; presumably it records the actor as `self` -- confirm against the full file.
643 if(member.equals(clusterActor.getMember())) {
646 members.put(clusterActor.getNode(), clusterActor);
647 log.info(clusterActor.toString());
// Only member counts of 1, 3 and 6 set a site configuration in the visible code.
650 if(members.size() == 1) {
651 log.info("1 member found. This is a solo environment.");
652 siteConfiguration = SiteConfiguration.Solo;
654 else if(members.size() == 3) {
655 log.info("This is a single site.");
656 siteConfiguration = SiteConfiguration.Single;
658 else if(members.size() == 6) {
659 log.info("This is a georedundant site.");
660 siteConfiguration = SiteConfiguration.Geo;
664 private void getMemberStatus(ClusterActor clusterActor) throws IOException {
665 log.info("Getting member status for " + clusterActor.getNode());
666 String content = getRequestContent(HTTP_PROTOCOL + clusterActor.getNode() + JOLOKIA_CLUSTER_PATH, HttpMethod.Get);
668 JSONObject responseJson = new JSONObject(content);
669 JSONObject responseValue = responseJson.getJSONObject("value");
670 clusterActor.setUp("Up".equals(responseValue.getString("MemberStatus")));
671 clusterActor.setUnreachable(false);
672 } catch(JSONException e) {
673 log.error("Error parsing response from " + clusterActor.getNode(), e);
674 clusterActor.setUp(false);
675 clusterActor.setUnreachable(true);
679 private void getShardStatus(ClusterActor clusterActor) throws IOException {
680 log.info("Getting shard status for " + clusterActor.getNode());
681 String content = getRequestContent(HTTP_PROTOCOL + clusterActor.getNode() + SHARD_MANAGER_PATH, HttpMethod.Get);
683 JSONObject responseValue = new JSONObject(content).getJSONObject("value");
684 JSONArray shardList = responseValue.getJSONArray("LocalShards");
686 String pattern = "-config$";
687 Pattern r = Pattern.compile(pattern);
689 for(int ndx = 0; ndx < shardList.length(); ndx++) {
690 String configShardName = shardList.getString(ndx);
691 m = r.matcher(configShardName);
692 String operationalShardName = m.replaceFirst("-operational");
693 String shardConfigPath = String.format(SHARD_PATH_TEMPLATE, configShardName);
694 String shardOperationalPath = String.format(SHARD_PATH_TEMPLATE, operationalShardName).replace("Config", "Operational");
695 extractShardInfo(clusterActor, configShardName, shardConfigPath);
696 extractShardInfo(clusterActor, operationalShardName, shardOperationalPath);
698 } catch(JSONException e) {
699 log.error("Error parsing response from " + clusterActor.getNode(), e);
703 private void extractShardInfo(ClusterActor clusterActor, String shardName, String shardPath) throws IOException {
704 log.info("Extracting shard info for " + shardName);
705 log.debug("Pulling config info for " + shardName + " from: " + shardPath);
706 String content = getRequestContent(HTTP_PROTOCOL + clusterActor.getNode() + shardPath, HttpMethod.Get);
707 log.debug("Response: " + content);
710 JSONObject shardValue = new JSONObject(content).getJSONObject("value");
711 clusterActor.setVoting(shardValue.getBoolean("Voting"));
712 if(shardValue.getString("PeerAddresses").length() > 0) {
713 clusterActor.getReplicaShards().add(shardName);
714 if(shardValue.getString("Leader").startsWith(clusterActor.getMember())) {
715 clusterActor.getShardLeader().add(shardName);
719 clusterActor.getNonReplicaShards().add(shardName);
721 JSONArray followerInfo = shardValue.getJSONArray("FollowerInfo");
722 for(int followerNdx = 0; followerNdx < followerInfo.length(); followerNdx++) {
723 int commitIndex = shardValue.getInt("CommitIndex");
724 int matchIndex = followerInfo.getJSONObject(followerNdx).getInt("matchIndex");
725 if(commitIndex != -1 && matchIndex != -1) {
726 int commitsBehind = commitIndex - matchIndex;
727 clusterActor.getCommits().put(followerInfo.getJSONObject(followerNdx).getString("id"), commitsBehind);
730 } catch(JSONException e) {
731 log.error("Error parsing response from " + clusterActor.getNode(), e);
735 private void getControllerHealth() {
736 ClusterActor clusterActor;
737 for(String key : members.keySet()) {
739 clusterActor = members.get(key);
740 // First flush out the old values
741 clusterActor.flush();
742 log.info("Gathering info for " + clusterActor.getNode());
743 getMemberStatus(clusterActor);
744 getShardStatus(clusterActor);
745 log.info("MemberInfo:\n" + clusterActor.toString());
746 } catch(IOException e) {
747 log.error("Connection Error", e);
748 members.get(key).setUnreachable(true);
749 members.get(key).setUp(false);
750 log.info("MemberInfo:\n" + members.get(key).toString());
/**
 * Adds or removes iptables DROP rules for the given nodes and then lists the rule table.
 *
 * @param task     the operation to perform
 * @param nodeInfo the nodes to act on; each element is cast to a generated {@code NodeInfo} type
 */
755 private void modifyIpTables(IpTables task, Object[] nodeInfo) {
756 log.info("Modifying IPTables rules...");
// NOTE(review): the statement that chooses between the two loops below is not visible next to
// them; presumably it dispatches on task - confirm.
// Isolation: elements are treated as halt-akka-traffic NodeInfo and DROP rules are appended (-A).
760 for(Object node : nodeInfo) {
761 org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.halt.akka.traffic.input.NodeInfo n =
762 (org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.halt.akka.traffic.input.NodeInfo) node;
763 log.info("Isolating " + n.getNode());
// INPUT chain: drop TCP from the node addressed to the port configured as controller.port.akka.
764 executeCommand(String.format("sudo /sbin/iptables -A INPUT -p tcp --destination-port %s -j DROP -s %s", properties.get("controller.port.akka"), n.getNode()));
// OUTPUT chain: drop TCP addressed to the node's own port.
// NOTE(review): this rule matches on source address (-s) of the remote node; for outbound
// traffic a destination match (-d) may have been intended - confirm.
765 executeCommand(String.format("sudo /sbin/iptables -A OUTPUT -p tcp --destination-port %s -j DROP -s %s", n.getPort(), n.getNode()));
// De-isolation: elements are treated as resume-akka-traffic NodeInfo and the same two rules are
// deleted (-D).
769 for(Object node : nodeInfo) {
770 org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.resume.akka.traffic.input.NodeInfo n =
771 (org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.resume.akka.traffic.input.NodeInfo) node;
772 log.info("De-isolating " + n.getNode());
773 executeCommand(String.format("sudo /sbin/iptables -D INPUT -p tcp --destination-port %s -j DROP -s %s", properties.get("controller.port.akka"), n.getNode()));
774 executeCommand(String.format("sudo /sbin/iptables -D OUTPUT -p tcp --destination-port %s -j DROP -s %s", n.getPort(), n.getNode()));
// List the rule table; executeCommand writes the command output to the log.
778 executeCommand("sudo /sbin/iptables -L");
781 private void executeCommand(String command) {
782 log.info("Executing command: " + command);
783 String[] cmd = command.split(" ");
785 Process p = Runtime.getRuntime().exec(cmd);
786 BufferedReader bufferedReader = new BufferedReader(new InputStreamReader(p.getInputStream()));
788 StringBuffer content = new StringBuffer();
789 while((inputLine = bufferedReader.readLine()) != null) {
790 content.append(inputLine);
792 bufferedReader.close();
793 log.info(content.toString());
794 } catch(IOException e) {
795 log.error("Error executing command", e);
799 private boolean crossSiteHealthRequest(String path) throws IOException {
800 String content = getRequestContent(path, HttpMethod.Post);
802 JSONObject responseJson = new JSONObject(content);
803 JSONObject responseValue = responseJson.getJSONObject("value");
804 return HEALTHY.equals(responseValue.getString("health"));
805 } catch(JSONException e) {
806 log.error("Error parsing JSON", e);
807 throw new IOException();
/**
 * Requests the ADM healthcheck endpoint and logs the HTTP status it answers with.
 *
 * <p>The URL is assembled from the {@code adm.*} properties: scheme and port depend on whether
 * {@code adm.useSsl} is {@code "true"}, followed by {@code adm.fqdn} and {@code adm.healthcheck}.
 *
 * NOTE(review): the return statements are not visible alongside these lines; how the status
 * code and the IOException case map to the returned string needs to be confirmed.
 */
811 private String getAdminHealth() {
// Scheme and port are both selected by the same adm.useSsl flag.
812 String protocol = "true".equals(properties.getProperty("adm.useSsl")) ? "https://" : "http://";
813 String port = "true".equals(properties.getProperty("adm.useSsl")) ? properties.getProperty("adm.port.ssl") : properties.getProperty("adm.port.http");
// adm.healthcheck is appended directly after the port, without an added separator.
814 String path = protocol + properties.getProperty("adm.fqdn") + ":" + port + properties.getProperty("adm.healthcheck");
815 log.info("Requesting healthcheck from " + path);
// Only the status code of the GET request is read.
817 int response = getRequestStatus(path, HttpMethod.Get);
818 log.info("Response: " + response);
// A failed request is logged here rather than propagated.
822 } catch(IOException e) {
823 log.error("Problem getting ADM health.", e);
/**
 * Checks the database through {@code dbLib} and logs the outcome.
 *
 * <p>The database is logged as FAULTY when {@code dbLib} is not active, or when the connection
 * it hands out is closed or read-only; otherwise it is logged as HEALTHY. A
 * {@link SQLException} raised during the checks is logged as FAULTY together with the exception.
 *
 * NOTE(review): the return statements are not visible alongside these lines; presumably each
 * branch returns a matching health string - confirm.
 */
828 private String getDatabaseHealth() {
829 log.info("Determining database health...");
// Log each indicator individually before evaluating them together.
831 log.info("DBLib isActive(): " + dbLib.isActive());
832 log.info("DBLib isReadOnly(): " + dbLib.getConnection().isReadOnly());
833 log.info("DBLib isClosed(): " + dbLib.getConnection().isClosed());
// NOTE(review): getConnection() is called several times and the results are never closed here;
// verify whether each call hands out a connection that must be released.
834 if(!dbLib.isActive() || dbLib.getConnection().isClosed() || dbLib.getConnection().isReadOnly()) {
835 log.warn("Database is FAULTY");
838 log.info("Database is HEALTHY");
839 } catch(SQLException e) {
840 log.error("Database is FAULTY");
841 log.error("Error", e);
/**
 * Performs a request without a payload and returns the response body.
 *
 * <p>Delegates to the three-argument overload with a {@code null} input.
 *
 * @param path   the URL to request
 * @param method the HTTP method to use
 * @return the response body as returned by the three-argument overload
 * @throws IOException if the three-argument overload throws it
 */
848 private String getRequestContent(String path, HttpMethod method) throws IOException {
849 return getRequestContent(path, method, null);
852 private String getRequestContent(String path, HttpMethod method, String input) throws IOException {
853 HttpURLConnection connection = getConnection(path);
854 connection.setRequestMethod(method.getMethod());
855 connection.setDoInput(true);
858 sendPayload(input, connection);
861 BufferedReader bufferedReader = new BufferedReader(new InputStreamReader(connection.getInputStream()));
863 StringBuffer content = new StringBuffer();
864 while((inputLine = bufferedReader.readLine()) != null) {
865 content.append(inputLine);
867 bufferedReader.close();
868 connection.disconnect();
869 return content.toString();
/**
 * Performs a request without a payload and returns the HTTP status code.
 *
 * <p>Delegates to the three-argument overload with a {@code null} input.
 *
 * @param path   the URL to request
 * @param method the HTTP method to use
 * @return the status code as returned by the three-argument overload
 * @throws IOException if the three-argument overload throws it
 */
872 private int getRequestStatus(String path, HttpMethod method) throws IOException {
873 return getRequestStatus(path, method, null);
876 private int getRequestStatus(String path, HttpMethod method, String input) throws IOException {
877 HttpURLConnection connection = getConnection(path);
878 connection.setRequestMethod(method.getMethod());
879 connection.setDoInput(true);
882 sendPayload(input, connection);
884 int response = connection.getResponseCode();
885 log.info("Received " + response + " response code from " + path);
886 connection.disconnect();
890 private void sendPayload(String input, HttpURLConnection connection) throws IOException {
891 byte[] out = input.getBytes(StandardCharsets.UTF_8);
892 int length = out.length;
894 connection.setFixedLengthStreamingMode(length);
895 connection.setRequestProperty("Content-Type", "application/json");
896 connection.setDoOutput(true);
897 connection.connect();
898 try(OutputStream os = connection.getOutputStream()) {
903 private HttpURLConnection getConnection(String host) throws IOException {
904 log.info("Getting connection to: " + host);
905 URL url = new URL(host);
906 String auth = "Basic " + javax.xml.bind.DatatypeConverter.printBase64Binary(CREDENTIALS.getBytes());
907 HttpURLConnection connection = (HttpURLConnection) url.openConnection();
908 connection.addRequestProperty("Authorization", auth);
909 connection.setRequestProperty("Connection", "keep-alive");
910 connection.setRequestProperty("Proxy-Connection", "keep-alive");
/** Type of the {@code task} argument of {@code modifyIpTables}. */
914 private enum IpTables {
/**
 * Site configuration options.
 *
 * NOTE(review): presumably distinguishes deployment layouts; confirm against the code that
 * reads it.
 */
919 private enum SiteConfiguration {
925 private enum HttpMethod {
929 private String method;
930 HttpMethod(String method) {
931 this.method = method;
933 public String getMethod() {