2 * ============LICENSE_START=======================================================
4 * ================================================================================
5 * Copyright (C) 2018 AT&T Intellectual Property. All rights
7 * ================================================================================
8 * Licensed under the Apache License, Version 2.0 (the "License");
9 * you may not use this file except in compliance with the License.
10 * You may obtain a copy of the License at
12 * http://www.apache.org/licenses/LICENSE-2.0
14 * Unless required by applicable law or agreed to in writing, software
15 * distributed under the License is distributed on an "AS IS" BASIS,
16 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
17 * See the License for the specific language governing permissions and
18 * limitations under the License.
19 * ============LICENSE_END=========================================================
22 package org.onap.ccsdk.sli.plugins.grtoolkit;
24 import java.io.BufferedReader;
26 import java.io.FileInputStream;
27 import java.io.FileReader;
28 import java.io.IOException;
29 import java.io.InputStreamReader;
30 import java.io.OutputStream;
31 import java.net.HttpURLConnection;
33 import java.nio.charset.StandardCharsets;
34 import java.sql.Connection;
35 import java.sql.SQLException;
36 import java.util.ArrayList;
37 import java.util.Collection;
38 import java.util.HashMap;
40 import java.util.Properties;
41 import java.util.List;
42 import java.util.concurrent.ExecutorService;
43 import java.util.concurrent.Executors;
44 import java.util.regex.Matcher;
45 import java.util.regex.Pattern;
46 import javax.annotation.Nonnull;
48 import com.google.common.util.concurrent.Futures;
49 import com.google.common.util.concurrent.ListenableFuture;
51 import org.onap.ccsdk.sli.core.dblib.DBLibConnection;
52 import org.onap.ccsdk.sli.core.dblib.DbLibService;
53 import org.onap.ccsdk.sli.plugins.grtoolkit.data.ClusterActor;
54 import org.onap.ccsdk.sli.plugins.grtoolkit.data.MemberBuilder;
56 import org.json.JSONArray;
57 import org.json.JSONException;
58 import org.json.JSONObject;
60 import org.opendaylight.controller.cluster.datastore.DistributedDataStoreInterface;
61 import org.opendaylight.controller.md.sal.binding.api.DataBroker;
62 import org.opendaylight.controller.md.sal.binding.api.DataTreeChangeListener;
63 import org.opendaylight.controller.md.sal.binding.api.NotificationPublishService;
64 import org.opendaylight.controller.sal.binding.api.BindingAwareBroker;
65 import org.opendaylight.controller.sal.binding.api.RpcProviderRegistry;
66 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthInput;
67 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthOutput;
68 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.AdminHealthOutputBuilder;
69 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthInput;
70 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthOutput;
71 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ClusterHealthOutputBuilder;
72 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthInput;
73 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthOutput;
74 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.DatabaseHealthOutputBuilder;
75 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverInput;
76 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverOutput;
77 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.FailoverOutputBuilder;
78 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.GrToolkitService;
79 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficInput;
80 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficOutput;
81 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.HaltAkkaTrafficOutputBuilder;
82 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.Member;
83 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficInput;
84 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficOutput;
85 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.ResumeAkkaTrafficOutputBuilder;
86 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.Site;
87 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthInput;
88 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthOutput;
89 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteHealthOutputBuilder;
90 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierInput;
91 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierOutput;
92 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.SiteIdentifierOutputBuilder;
93 import org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.site.health.output.SitesBuilder;
94 import org.opendaylight.yangtools.yang.common.RpcResult;
95 import org.opendaylight.yangtools.yang.common.RpcResultBuilder;
97 import org.slf4j.Logger;
98 import org.slf4j.LoggerFactory;
100 public class GrToolkitProvider implements AutoCloseable, GrToolkitService, DataTreeChangeListener {
101 private static final String APP_NAME = "gr-toolkit";
102 private static final String PROPERTIES_FILE = System.getenv("SDNC_CONFIG_DIR") + "/gr-toolkit.properties";
103 private static final String HEALTHY = "HEALTHY";
104 private static final String FAULTY = "FAULTY";
105 private static final String VALUE = "value";
106 private String akkaConfig;
107 private String jolokiaClusterPath;
108 private String shardManagerPath;
109 private String shardPathTemplate;
110 private String credentials;
111 private String httpProtocol;
112 private String siteIdentifier = System.getenv("SITE_NAME");
113 private final Logger log = LoggerFactory.getLogger(GrToolkitProvider.class);
114 private final ExecutorService executor;
115 protected DataBroker dataBroker;
116 protected NotificationPublishService notificationService;
117 protected RpcProviderRegistry rpcRegistry;
118 protected BindingAwareBroker.RpcRegistration<GrToolkitService> rpcRegistration;
119 protected DbLibService dbLib;
120 private String member;
121 private ClusterActor self;
122 private HashMap<String, ClusterActor> memberMap;
123 private SiteConfiguration siteConfiguration;
124 private Properties properties;
125 private DistributedDataStoreInterface configDatastore;
/**
 * Creates the provider, stores the supplied services and runs the provider initialization.
 *
 * @param dataBroker                  MD-SAL data broker
 * @param notificationProviderService notification publish service
 * @param rpcProviderRegistry         registry this provider registers its RPC implementation with
 * @param configDatastore             datastore used to look up the current cluster member name
 * @param dbLibService                database library service
 */
public GrToolkitProvider(DataBroker dataBroker,
                         NotificationPublishService notificationProviderService,
                         RpcProviderRegistry rpcProviderRegistry,
                         DistributedDataStoreInterface configDatastore,
                         DbLibService dbLibService) {
    log.info("Creating provider for {}", APP_NAME);

    // Single worker thread; released again in close().
    executor = Executors.newFixedThreadPool(1);

    this.dataBroker = dataBroker;
    notificationService = notificationProviderService;
    rpcRegistry = rpcProviderRegistry;
    this.configDatastore = configDatastore;
    dbLib = dbLibService;

    initialize();
}
141 private void initialize() {
142 log.info("Initializing provider for {}", APP_NAME);
143 // Create the top level containers
148 rpcRegistration = rpcRegistry.addRpcImplementation(GrToolkitService.class, this);
149 log.info("Initialization complete for {}", APP_NAME);
152 private void setProperties() {
153 log.info("Loading properties from {}", PROPERTIES_FILE);
154 properties = new Properties();
155 File propertiesFile = new File(PROPERTIES_FILE);
156 if(!propertiesFile.exists()) {
157 log.warn("Properties file not found.");
160 try(FileInputStream fileInputStream = new FileInputStream(propertiesFile)) {
161 properties.load(fileInputStream);
162 if(!properties.containsKey(PropertyKeys.SITE_IDENTIFIER)) {
163 properties.put(PropertyKeys.SITE_IDENTIFIER, "Unknown Site");
165 String port = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL).trim()) ? properties.getProperty(PropertyKeys.CONTROLLER_PORT_SSL).trim() : properties.getProperty(PropertyKeys.CONTROLLER_PORT_HTTP).trim();
166 httpProtocol = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL).trim()) ? "https://" : "http://";
167 akkaConfig = properties.getProperty(PropertyKeys.AKKA_CONF_LOCATION).trim();
168 jolokiaClusterPath = ":" + port + properties.getProperty(PropertyKeys.MBEAN_CLUSTER).trim();
169 shardManagerPath = ":" + port + properties.getProperty(PropertyKeys.MBEAN_SHARD_MANAGER).trim();
170 shardPathTemplate = ":" + port + properties.getProperty(PropertyKeys.MBEAN_SHARD_CONFIG).trim();
171 if(siteIdentifier == null || siteIdentifier.isEmpty()) {
172 siteIdentifier = properties.getProperty(PropertyKeys.SITE_IDENTIFIER).trim();
174 credentials = properties.getProperty(PropertyKeys.CONTROLLER_CREDENTIALS).trim();
175 log.info("Loaded properties.");
176 } catch(IOException e) {
177 log.error("Error loading properties.", e);
181 private void defineMembers() {
182 member = configDatastore.getActorContext().getCurrentMemberName().getName();
183 log.info("Cluster member: {}", member);
185 log.info("Parsing akka.conf for cluster memberMap...");
187 File akkaConfigFile = new File(this.akkaConfig);
188 try(FileReader fileReader = new FileReader(akkaConfigFile);
189 BufferedReader bufferedReader = new BufferedReader(fileReader)) {
191 while((line = bufferedReader.readLine()) != null) {
192 if(line.contains("seed-nodes =")) {
193 parseSeedNodes(line);
198 } catch(IOException e) {
199 log.error("Couldn't load akka", e);
200 } catch(NullPointerException e) {
201 log.error("akkaConfig is null. Check properties file and restart {} bundle.", APP_NAME);
203 log.info("self:\n{}", self);
206 private void createContainers() {
207 // Replace with MD-SAL write for FailoverStatus
210 protected void initializeChild() {
211 // Override if you have custom initialization intelligence
215 public void close() throws Exception {
216 log.info("Closing provider for {}", APP_NAME);
218 rpcRegistration.close();
219 log.info("Successfully closed provider for {}", APP_NAME);
223 public void onDataTreeChanged(@Nonnull Collection changes) {
224 log.info("onDataTreeChanged() called. but there is no change here");
228 public ListenableFuture<RpcResult<ClusterHealthOutput>> clusterHealth(ClusterHealthInput input) {
229 log.info("{}:cluster-health invoked.", APP_NAME);
230 getControllerHealth();
231 return buildClusterHealthOutput("200");
235 public ListenableFuture<RpcResult<SiteHealthOutput>> siteHealth(SiteHealthInput input) {
236 log.info("{}:site-health invoked.", APP_NAME);
237 getControllerHealth();
238 return buildSiteHealthOutput("200", getAdminHealth(), getDatabaseHealth());
242 public ListenableFuture<RpcResult<DatabaseHealthOutput>> databaseHealth(DatabaseHealthInput input) {
243 log.info("{}:database-health invoked.", APP_NAME);
244 DatabaseHealthOutputBuilder outputBuilder = new DatabaseHealthOutputBuilder();
245 outputBuilder.setStatus("200");
246 outputBuilder.setHealth(getDatabaseHealth());
247 outputBuilder.setServedBy(member);
249 return Futures.immediateFuture(RpcResultBuilder.<DatabaseHealthOutput>status(true).withResult(outputBuilder.build()).build());
253 public ListenableFuture<RpcResult<AdminHealthOutput>> adminHealth(AdminHealthInput input) {
254 log.info("{}:admin-health invoked.", APP_NAME);
255 AdminHealthOutputBuilder outputBuilder = new AdminHealthOutputBuilder();
256 outputBuilder.setStatus("200");
257 outputBuilder.setHealth(getAdminHealth());
258 outputBuilder.setServedBy(member);
260 return Futures.immediateFuture(RpcResultBuilder.<AdminHealthOutput>status(true).withResult(outputBuilder.build()).build());
264 public ListenableFuture<RpcResult<HaltAkkaTrafficOutput>> haltAkkaTraffic(HaltAkkaTrafficInput input) {
265 log.info("{}:halt-akka-traffic invoked.", APP_NAME);
266 HaltAkkaTrafficOutputBuilder outputBuilder = new HaltAkkaTrafficOutputBuilder();
267 outputBuilder.setStatus("200");
268 modifyIpTables(IpTables.ADD, input.getNodeInfo().toArray());
269 outputBuilder.setServedBy(member);
271 return Futures.immediateFuture(RpcResultBuilder.<HaltAkkaTrafficOutput>status(true).withResult(outputBuilder.build()).build());
275 public ListenableFuture<RpcResult<ResumeAkkaTrafficOutput>> resumeAkkaTraffic(ResumeAkkaTrafficInput input) {
276 log.info("{}:resume-akka-traffic invoked.", APP_NAME);
277 ResumeAkkaTrafficOutputBuilder outputBuilder = new ResumeAkkaTrafficOutputBuilder();
278 outputBuilder.setStatus("200");
279 modifyIpTables(IpTables.DELETE, input.getNodeInfo().toArray());
280 outputBuilder.setServedBy(member);
282 return Futures.immediateFuture(RpcResultBuilder.<ResumeAkkaTrafficOutput>status(true).withResult(outputBuilder.build()).build());
286 public ListenableFuture<RpcResult<SiteIdentifierOutput>> siteIdentifier(SiteIdentifierInput input) {
287 log.info("{}:site-identifier invoked.", APP_NAME);
288 SiteIdentifierOutputBuilder outputBuilder = new SiteIdentifierOutputBuilder();
289 outputBuilder.setStatus("200");
290 outputBuilder.setId(siteIdentifier);
291 outputBuilder.setServedBy(member);
293 return Futures.immediateFuture(RpcResultBuilder.<SiteIdentifierOutput>status(true).withResult(outputBuilder.build()).build());
297 public ListenableFuture<RpcResult<FailoverOutput>> failover(FailoverInput input) {
298 log.info("{}:failover invoked.", APP_NAME);
299 FailoverOutputBuilder outputBuilder = new FailoverOutputBuilder();
300 outputBuilder.setServedBy(member);
301 if(siteConfiguration != SiteConfiguration.GEO) {
302 log.info("Cannot failover non-GEO site.");
303 outputBuilder.setMessage("Failover aborted. This is not a GEO configuration.");
304 outputBuilder.setStatus("400");
305 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
307 ArrayList<ClusterActor> activeSite = new ArrayList<>();
308 ArrayList<ClusterActor> standbySite = new ArrayList<>();
310 log.info("Performing preliminary cluster health check...");
311 // Necessary to populate all member info. Health is not used for judgement calls.
312 getControllerHealth();
314 log.info("Determining active site...");
315 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
316 String key = entry.getKey();
317 ClusterActor clusterActor = entry.getValue();
318 if(clusterActor.isVoting()) {
319 activeSite.add(clusterActor);
320 log.debug("Active Site member: {}", key);
323 standbySite.add(clusterActor);
324 log.debug("Standby Site member: {}", key);
328 String port = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL)) ? properties.getProperty(PropertyKeys.CONTROLLER_PORT_SSL) : properties.getProperty(PropertyKeys.CONTROLLER_PORT_HTTP);
330 if(Boolean.parseBoolean(input.getBackupData())) {
331 backupMdSal(activeSite, port);
334 if(!changeClusterVoting(outputBuilder, activeSite, standbySite, port))
335 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
337 if(Boolean.parseBoolean(input.getIsolate())) {
338 isolateSiteFromCluster(activeSite, standbySite, port);
340 if(Boolean.parseBoolean(input.getDownUnreachable())) {
341 downUnreachableNodes(activeSite, standbySite, port);
345 log.info("{}:failover complete.", APP_NAME);
347 outputBuilder.setMessage("Failover complete.");
348 outputBuilder.setStatus("200");
349 return Futures.immediateFuture(RpcResultBuilder.<FailoverOutput>status(true).withResult(outputBuilder.build()).build());
352 private void isolateSiteFromCluster(ArrayList<ClusterActor> activeSite, ArrayList<ClusterActor> standbySite, String port) {
353 log.info("Halting Akka traffic...");
354 for(ClusterActor actor : standbySite) {
356 log.info("Halting Akka traffic for: {}", actor.getNode());
357 // Build JSON with activeSite actor Node and actor AkkaPort
358 JSONObject akkaInput = new JSONObject();
359 JSONObject inputBlock = new JSONObject();
360 JSONArray votingStateArray = new JSONArray();
362 for(ClusterActor node : activeSite) {
363 nodeInfo = new JSONObject();
364 nodeInfo.put("node", node.getNode());
365 nodeInfo.put("port", node.getAkkaPort());
366 votingStateArray.put(nodeInfo);
368 inputBlock.put("node-info", votingStateArray);
369 akkaInput.put("input", inputBlock);
370 getRequestContent(httpProtocol + actor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:halt-akka-traffic", HttpMethod.POST, akkaInput.toString());
371 } catch(IOException e) {
372 log.error("Could not halt Akka traffic for: " + actor.getNode(), e);
377 private void downUnreachableNodes(ArrayList<ClusterActor> activeSite, ArrayList<ClusterActor> standbySite, String port) {
378 log.info("Setting site unreachable...");
379 JSONObject jolokiaInput = new JSONObject();
380 jolokiaInput.put("type", "EXEC");
381 jolokiaInput.put("mbean", "akka:type=Cluster");
382 jolokiaInput.put("operation", "down");
383 JSONArray arguments = new JSONArray();
384 for(ClusterActor actor : activeSite) {
385 // Build Jolokia input
386 // May need to change from akka port to actor.getAkkaPort()
387 arguments.put("akka.tcp://opendaylight-cluster-data@" + actor.getNode() + ":" + properties.getProperty(PropertyKeys.CONTROLLER_PORT_AKKA));
389 jolokiaInput.put("arguments", arguments);
390 log.debug("{}", jolokiaInput);
392 log.info("Setting nodes unreachable");
393 getRequestContent(httpProtocol + standbySite.get(0).getNode() + ":" + port + "/jolokia", HttpMethod.POST, jolokiaInput.toString());
394 } catch(IOException e) {
395 log.error("Error setting nodes unreachable", e);
399 private boolean changeClusterVoting(FailoverOutputBuilder outputBuilder, ArrayList<ClusterActor> activeSite, ArrayList<ClusterActor> standbySite, String port) {
400 log.info("Changing voting for all shards to standby site...");
402 JSONObject votingInput = new JSONObject();
403 JSONObject inputBlock = new JSONObject();
404 JSONArray votingStateArray = new JSONArray();
405 JSONObject memberVotingState;
406 for(ClusterActor actor : activeSite) {
407 memberVotingState = new JSONObject();
408 memberVotingState.put("member-name", actor.getMember());
409 memberVotingState.put("voting", false);
410 votingStateArray.put(memberVotingState);
412 for(ClusterActor actor : standbySite) {
413 memberVotingState = new JSONObject();
414 memberVotingState.put("member-name", actor.getMember());
415 memberVotingState.put("voting", true);
416 votingStateArray.put(memberVotingState);
418 inputBlock.put("member-voting-state", votingStateArray);
419 votingInput.put("input", inputBlock);
420 log.debug("{}", votingInput);
421 // Change voting all shards
422 getRequestContent(httpProtocol + self.getNode() + ":" + port + "/restconf/operations/cluster-admin:change-member-voting-states-for-all-shards", HttpMethod.POST, votingInput.toString());
423 } catch(IOException e) {
424 log.error("Changing voting", e);
425 outputBuilder.setMessage("Failover aborted. Failed to change voting.");
426 outputBuilder.setStatus("500");
432 private void backupMdSal(ArrayList<ClusterActor> activeSite, String port) {
433 log.info("Backing up data...");
435 log.info("Scheduling backup for: {}", activeSite.get(0).getNode());
436 getRequestContent(httpProtocol + activeSite.get(0).getNode() + ":" + port + "/restconf/operations/data-export-import:schedule-export", HttpMethod.POST, "{ \"input\": { \"run-at\": \"30\" } }");
437 } catch(IOException e) {
438 log.error("Error backing up MD-SAL", e);
440 for(ClusterActor actor : activeSite) {
443 log.info("Backing up data for: {}", actor.getNode());
444 getRequestContent(httpProtocol + actor.getNode() + ":" + port + "/restconf/operations/daexim-offsite-backup:backup-data", HttpMethod.POST);
445 } catch(IOException e) {
446 log.error("Error backing up data.", e);
451 private ListenableFuture<RpcResult<ClusterHealthOutput>> buildClusterHealthOutput(String statusCode) {
452 ClusterHealthOutputBuilder outputBuilder = new ClusterHealthOutputBuilder();
453 outputBuilder.setStatus(statusCode);
454 outputBuilder.setMembers((List) new ArrayList<Member>());
458 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
459 ClusterActor clusterActor = entry.getValue();
460 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
461 if(ClusterActor.SITE_1.equals(clusterActor.getSite()))
463 else if(ClusterActor.SITE_2.equals(clusterActor.getSite()))
466 outputBuilder.getMembers().add(new MemberBuilder(clusterActor).build());
468 if(siteConfiguration == SiteConfiguration.SOLO) {
469 outputBuilder.setSite1Health(HEALTHY);
471 else if(site1Health > 1) {
472 outputBuilder.setSite1Health(HEALTHY);
475 outputBuilder.setSite1Health(FAULTY);
478 if(siteConfiguration == SiteConfiguration.GEO && site2Health > 1) {
479 outputBuilder.setSite2Health(HEALTHY);
481 else if(siteConfiguration == SiteConfiguration.GEO) {
482 outputBuilder.setSite2Health(FAULTY);
485 outputBuilder.setServedBy(member);
486 RpcResult<ClusterHealthOutput> rpcResult = RpcResultBuilder.<ClusterHealthOutput>status(true).withResult(outputBuilder.build()).build();
487 return Futures.immediateFuture(rpcResult);
490 private ListenableFuture<RpcResult<SiteHealthOutput>> buildSiteHealthOutput(String statusCode, String adminHealth, String databaseHealth) {
491 SiteHealthOutputBuilder outputBuilder = new SiteHealthOutputBuilder();
492 outputBuilder.setStatus(statusCode);
493 outputBuilder.setSites((List) new ArrayList<Site>());
495 if(siteConfiguration != SiteConfiguration.GEO) {
497 SitesBuilder builder = new SitesBuilder();
498 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
499 ClusterActor clusterActor = entry.getValue();
500 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
504 if(siteConfiguration != SiteConfiguration.SOLO) {
505 builder.setHealth(HEALTHY);
506 builder.setRole("ACTIVE");
507 builder.setId(siteIdentifier);
510 builder = getSitesBuilder(healthyODLs, true, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), siteIdentifier);
512 outputBuilder.getSites().add(builder.build());
515 int site1HealthyODLs = 0;
516 int site2HealthyODLs = 0;
517 boolean site1Voting = false;
518 boolean site2Voting = false;
519 boolean performedCrossSiteHealthCheck = false;
520 boolean crossSiteAdminHealthy = false;
521 boolean crossSiteDbHealthy = false;
522 String crossSiteIdentifier = "UNKNOWN_SITE";
523 String port = "true".equals(properties.getProperty(PropertyKeys.CONTROLLER_USE_SSL)) ? properties.getProperty(PropertyKeys.CONTROLLER_PORT_SSL) : properties.getProperty(PropertyKeys.CONTROLLER_PORT_HTTP);
525 // Make calls over to site 2 healthchecks
526 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
527 ClusterActor clusterActor = entry.getValue();
528 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
529 if(ClusterActor.SITE_1.equals(clusterActor.getSite())) {
531 if(clusterActor.isVoting()) {
537 if(clusterActor.isVoting()) {
540 if(!performedCrossSiteHealthCheck) {
542 String content = getRequestContent(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:site-identifier", HttpMethod.POST);
543 crossSiteIdentifier = new JSONObject(content).getJSONObject("output").getString("id");
544 crossSiteDbHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:database-health");
545 crossSiteAdminHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:admin-health");
546 performedCrossSiteHealthCheck = true;
547 } catch(Exception e) {
548 log.info("Cannot get site identifier from {}", clusterActor.getNode());
549 log.error("Site Health Error", e);
555 SitesBuilder builder = getSitesBuilder(site1HealthyODLs, site1Voting, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), siteIdentifier);
556 outputBuilder.getSites().add(builder.build());
557 builder = getSitesBuilder(site2HealthyODLs, site2Voting, crossSiteAdminHealthy, crossSiteDbHealthy, crossSiteIdentifier);
558 outputBuilder.getSites().add(builder.build());
561 // Make calls over to site 1 healthchecks
562 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
563 ClusterActor clusterActor = entry.getValue();
564 if(clusterActor.isUp() && !clusterActor.isUnreachable()) {
565 if(ClusterActor.SITE_1.equals(clusterActor.getSite())) {
567 if(clusterActor.isVoting()) {
570 if(!performedCrossSiteHealthCheck) {
572 String content = getRequestContent(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:site-identifier", HttpMethod.POST);
573 crossSiteIdentifier = new JSONObject(content).getJSONObject("output").getString("id");
574 crossSiteDbHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:database-health");
575 crossSiteAdminHealthy = crossSiteHealthRequest(httpProtocol + clusterActor.getNode() + ":" + port + "/restconf/operations/gr-toolkit:admin-health");
576 performedCrossSiteHealthCheck = true;
577 } catch(Exception e) {
578 log.info("Cannot get site identifier from {}", clusterActor.getNode());
579 log.error("Site Health Error", e);
585 if(clusterActor.isVoting()) {
592 SitesBuilder builder = getSitesBuilder(site1HealthyODLs, site1Voting, crossSiteAdminHealthy, crossSiteDbHealthy, crossSiteIdentifier);
593 outputBuilder.getSites().add(builder.build());
594 builder = getSitesBuilder(site2HealthyODLs, site2Voting, HEALTHY.equals(adminHealth), HEALTHY.equals(databaseHealth), siteIdentifier);
595 outputBuilder.getSites().add(builder.build());
599 outputBuilder.setServedBy(member);
600 RpcResult<SiteHealthOutput> rpcResult = RpcResultBuilder.<SiteHealthOutput>status(true).withResult(outputBuilder.build()).build();
601 return Futures.immediateFuture(rpcResult);
604 private SitesBuilder getSitesBuilder(int siteHealthyODLs, boolean siteVoting, boolean adminHealthy, boolean dbHealthy, String siteIdentifier) {
605 SitesBuilder builder = new SitesBuilder();
606 if(siteHealthyODLs > 1) {
607 builder.setHealth(HEALTHY);
610 log.warn("{} Healthy ODLs: {}", siteIdentifier, siteHealthyODLs);
611 builder.setHealth(FAULTY);
614 log.warn("{} Admin Health: {}", siteIdentifier, FAULTY);
615 builder.setHealth(FAULTY);
618 log.warn("{} Database Health: {}", siteIdentifier, FAULTY);
619 builder.setHealth(FAULTY);
622 builder.setRole("ACTIVE");
625 builder.setRole("STANDBY");
627 builder.setId(siteIdentifier);
631 private boolean isSite1() {
632 int memberNumber = Integer.parseInt(member.split("-")[1]);
633 boolean isSite1 = memberNumber < 4;
634 log.info("isSite1(): {}", isSite1);
638 private void parseSeedNodes(String line) {
639 memberMap = new HashMap<>();
640 line = line.substring(line.indexOf("[\""), line.indexOf(']'));
641 String[] splits = line.split(",");
643 for(int ndx = 0; ndx < splits.length; ndx++) {
644 String nodeName = splits[ndx];
645 int delimLocation = nodeName.indexOf('@');
646 String port = nodeName.substring(splits[ndx].indexOf(':', delimLocation) + 1, splits[ndx].indexOf('"', splits[ndx].indexOf(':')));
647 splits[ndx] = nodeName.substring(delimLocation + 1, splits[ndx].indexOf(':', delimLocation));
648 log.info("Adding node: {}:{}", splits[ndx], port);
649 ClusterActor clusterActor = new ClusterActor();
650 clusterActor.setNode(splits[ndx]);
651 clusterActor.setAkkaPort(port);
652 clusterActor.setMember("member-" + (ndx + 1));
654 clusterActor.setSite(ClusterActor.SITE_1);
657 clusterActor.setSite(ClusterActor.SITE_2);
660 if(member.equals(clusterActor.getMember())) {
663 memberMap.put(clusterActor.getNode(), clusterActor);
664 log.info("{}", clusterActor);
667 if(memberMap.size() == 1) {
668 log.info("1 member found. This is a solo environment.");
669 siteConfiguration = SiteConfiguration.SOLO;
671 else if(memberMap.size() == 3) {
672 log.info("This is a single site.");
673 siteConfiguration = SiteConfiguration.SINGLE;
675 else if(memberMap.size() == 6) {
676 log.info("This is a georedundant site.");
677 siteConfiguration = SiteConfiguration.GEO;
681 private void getMemberStatus(ClusterActor clusterActor) throws IOException {
682 log.info("Getting member status for {}", clusterActor.getNode());
683 String content = getRequestContent(httpProtocol + clusterActor.getNode() + jolokiaClusterPath, HttpMethod.GET);
685 JSONObject responseJson = new JSONObject(content);
686 JSONObject responseValue = responseJson.getJSONObject(VALUE);
687 clusterActor.setUp("Up".equals(responseValue.getString("MemberStatus")));
688 clusterActor.setUnreachable(false);
689 } catch(JSONException e) {
690 log.error("Error parsing response from {}", clusterActor.getNode(), e);
691 clusterActor.setUp(false);
692 clusterActor.setUnreachable(true);
696 private void getShardStatus(ClusterActor clusterActor) throws IOException {
697 log.info("Getting shard status for {}", clusterActor.getNode());
698 String content = getRequestContent(httpProtocol + clusterActor.getNode() + shardManagerPath, HttpMethod.GET);
700 JSONObject responseValue = new JSONObject(content).getJSONObject(VALUE);
701 JSONArray shardList = responseValue.getJSONArray("LocalShards");
703 String pattern = "-config$";
704 Pattern r = Pattern.compile(pattern);
706 for(int ndx = 0; ndx < shardList.length(); ndx++) {
707 String configShardName = shardList.getString(ndx);
708 m = r.matcher(configShardName);
709 String operationalShardName = m.replaceFirst("-operational");
710 String shardConfigPath = String.format(shardPathTemplate, configShardName);
711 String shardOperationalPath = String.format(shardPathTemplate, operationalShardName).replace("Config", "Operational");
712 extractShardInfo(clusterActor, configShardName, shardConfigPath);
713 extractShardInfo(clusterActor, operationalShardName, shardOperationalPath);
715 } catch(JSONException e) {
716 log.error("Error parsing response from " + clusterActor.getNode(), e);
720 private void extractShardInfo(ClusterActor clusterActor, String shardName, String shardPath) throws IOException {
721 log.info("Extracting shard info for {}", shardName);
722 log.debug("Pulling config info for {} from: {}", shardName, shardPath);
723 String content = getRequestContent(httpProtocol + clusterActor.getNode() + shardPath, HttpMethod.GET);
724 log.debug("Response: {}", content);
727 JSONObject shardValue = new JSONObject(content).getJSONObject(VALUE);
728 clusterActor.setVoting(shardValue.getBoolean("Voting"));
729 if(shardValue.getString("PeerAddresses").length() > 0) {
730 clusterActor.getReplicaShards().add(shardName);
731 if(shardValue.getString("Leader").startsWith(clusterActor.getMember())) {
732 clusterActor.getShardLeader().add(shardName);
736 clusterActor.getNonReplicaShards().add(shardName);
738 JSONArray followerInfo = shardValue.getJSONArray("FollowerInfo");
739 for(int followerNdx = 0; followerNdx < followerInfo.length(); followerNdx++) {
740 int commitIndex = shardValue.getInt("CommitIndex");
741 int matchIndex = followerInfo.getJSONObject(followerNdx).getInt("matchIndex");
742 if(commitIndex != -1 && matchIndex != -1) {
743 int commitsBehind = commitIndex - matchIndex;
744 clusterActor.getCommits().put(followerInfo.getJSONObject(followerNdx).getString("id"), commitsBehind);
747 } catch(JSONException e) {
748 log.error("Error parsing response from " + clusterActor.getNode(), e);
752 private void getControllerHealth() {
753 for(Map.Entry<String, ClusterActor> entry : memberMap.entrySet()) {
754 ClusterActor clusterActor = entry.getValue();
755 String key = entry.getKey();
757 // First flush out the old values
758 clusterActor.flush();
759 log.info("Gathering info for {}", clusterActor.getNode());
760 getMemberStatus(clusterActor);
761 getShardStatus(clusterActor);
762 log.info("MemberInfo:\n{}", clusterActor);
763 } catch(IOException e) {
764 log.error("Connection Error", e);
765 memberMap.get(key).setUnreachable(true);
766 memberMap.get(key).setUp(false);
767 log.info("MemberInfo:\n{}", memberMap.get(key));
772 private void modifyIpTables(IpTables task, Object[] nodeInfo) {
773 log.info("Modifying IPTables rules...");
774 if(task == IpTables.ADD) {
775 for(Object node : nodeInfo) {
776 org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.halt.akka.traffic.input.NodeInfo n =
777 (org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.halt.akka.traffic.input.NodeInfo) node;
778 log.info("Isolating {}", n.getNode());
779 executeCommand(String.format("sudo /sbin/iptables -A INPUT -p tcp --destination-port %s -j DROP -s %s", properties.get(PropertyKeys.CONTROLLER_PORT_AKKA), n.getNode()));
780 executeCommand(String.format("sudo /sbin/iptables -A OUTPUT -p tcp --destination-port %s -j DROP -s %s", n.getPort(), n.getNode()));
783 } else if(task == IpTables.DELETE) {
784 for(Object node : nodeInfo) {
785 org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.resume.akka.traffic.input.NodeInfo n =
786 (org.opendaylight.yang.gen.v1.org.onap.ccsdk.sli.plugins.gr.toolkit.rev180926.resume.akka.traffic.input.NodeInfo) node;
787 log.info("De-isolating {}", n.getNode());
788 executeCommand(String.format("sudo /sbin/iptables -D INPUT -p tcp --destination-port %s -j DROP -s %s", properties.get(PropertyKeys.CONTROLLER_PORT_AKKA), n.getNode()));
789 executeCommand(String.format("sudo /sbin/iptables -D OUTPUT -p tcp --destination-port %s -j DROP -s %s", n.getPort(), n.getNode()));
793 executeCommand("sudo /sbin/iptables -L");
796 private void executeCommand(String command) {
797 log.info("Executing command: {}", command);
798 String[] cmd = command.split(" ");
800 Process p = Runtime.getRuntime().exec(cmd);
801 BufferedReader bufferedReader = new BufferedReader(new InputStreamReader(p.getInputStream()));
803 StringBuilder content = new StringBuilder();
804 while((inputLine = bufferedReader.readLine()) != null) {
805 content.append(inputLine);
807 bufferedReader.close();
808 log.info("{}", content);
809 } catch(IOException e) {
810 log.error("Error executing command", e);
814 private boolean crossSiteHealthRequest(String path) throws IOException {
815 String content = getRequestContent(path, HttpMethod.POST);
817 JSONObject responseJson = new JSONObject(content);
818 JSONObject responseValue = responseJson.getJSONObject(VALUE);
819 return HEALTHY.equals(responseValue.getString("health"));
820 } catch(JSONException e) {
821 log.error("Error parsing JSON", e);
822 throw new IOException();
/**
 * Requests the ADM healthcheck URL and derives a health string from the outcome.
 * <p>
 * The URL is built from the ADM properties: host from {@code ADM_FQDN}, path from
 * {@code ADM_HEALTHCHECK}, scheme and port chosen by {@code ADM_USE_SSL}. The request is a GET
 * and only its status code is read. An {@link IOException} from the request is caught and logged.
 * <p>
 * NOTE(review): the statements that map the status code, and the failure case, to the returned
 * string are not visible in this excerpt; confirm them before relying on a specific return value.
 */
826 private String getAdminHealth() {
// Only the exact string "true" selects https and the SSL port; any other value, or a missing
// property, falls back to http and the plain HTTP port.
827 String protocol = "true".equals(properties.getProperty(PropertyKeys.ADM_USE_SSL)) ? "https://" : "http://";
828 String port = "true".equals(properties.getProperty(PropertyKeys.ADM_USE_SSL)) ? properties.getProperty(PropertyKeys.ADM_PORT_SSL) : properties.getProperty(PropertyKeys.ADM_PORT_HTTP);
// No separator is inserted between port and healthcheck path, so the ADM_HEALTHCHECK value is
// appended directly after the port.
829 String path = protocol + properties.getProperty(PropertyKeys.ADM_FQDN) + ":" + port + properties.getProperty(PropertyKeys.ADM_HEALTHCHECK);
830 log.info("Requesting healthcheck from {}", path);
832 int response = getRequestStatus(path, HttpMethod.GET);
833 log.info("Response: {}", response);
837 } catch(IOException e) {
838 log.error("Problem getting ADM health.", e);
/**
 * Inspects DBLib and a connection obtained from it to judge database health.
 * <p>
 * The database is logged as FAULTY when DBLib is not active, or the connection is closed or
 * read-only, and also when any of these checks raises a {@link SQLException}. Otherwise it is
 * logged as HEALTHY.
 * <p>
 * NOTE(review): the return statements and any {@code connection.close()} calls are not visible
 * in this excerpt; verify that the connection taken from {@code dbLib} is released on every path.
 */
843 private String getDatabaseHealth() {
844 log.info("Determining database health...");
846 Connection connection = dbLib.getConnection();
// The three probes are logged individually at debug level before being evaluated together
847 log.debug("DBLib isActive(): {}", dbLib.isActive());
848 log.debug("DBLib isReadOnly(): {}", connection.isReadOnly());
849 log.debug("DBLib isClosed(): {}", connection.isClosed());
// Any single failing probe is enough to treat the database as faulty
850 if(!dbLib.isActive() || connection.isClosed() || connection.isReadOnly()) {
851 log.warn("Database is FAULTY");
856 log.info("Database is HEALTHY");
857 } catch(SQLException e) {
858 log.error("Database is FAULTY");
859 log.error("Error", e);
866 private String getRequestContent(String path, HttpMethod method) throws IOException {
867 return getRequestContent(path, method, null);
870 private String getRequestContent(String path, HttpMethod method, String input) throws IOException {
871 HttpURLConnection connection = getConnection(path);
872 connection.setRequestMethod(method.getMethod());
873 connection.setDoInput(true);
876 sendPayload(input, connection);
879 BufferedReader bufferedReader = new BufferedReader(new InputStreamReader(connection.getInputStream()));
881 StringBuilder content = new StringBuilder();
882 while((inputLine = bufferedReader.readLine()) != null) {
883 content.append(inputLine);
885 bufferedReader.close();
886 connection.disconnect();
888 String response = content.toString();
889 log.debug("getRequestContent(): Response:\n{}", response);
893 private int getRequestStatus(String path, HttpMethod method) throws IOException {
894 return getRequestStatus(path, method, null);
897 private int getRequestStatus(String path, HttpMethod method, String input) throws IOException {
898 HttpURLConnection connection = getConnection(path);
899 connection.setRequestMethod(method.getMethod());
900 connection.setDoInput(true);
903 sendPayload(input, connection);
905 int response = connection.getResponseCode();
906 log.info("Received {} response code from {}", response, path);
907 connection.disconnect();
911 private void sendPayload(String input, HttpURLConnection connection) throws IOException {
912 byte[] out = input.getBytes(StandardCharsets.UTF_8);
913 int length = out.length;
915 connection.setFixedLengthStreamingMode(length);
916 connection.setRequestProperty("Content-Type", "application/json");
917 connection.setDoOutput(true);
918 connection.connect();
919 try(OutputStream os = connection.getOutputStream()) {
924 private HttpURLConnection getConnection(String host) throws IOException {
925 log.info("Getting connection to: {}", host);
926 URL url = new URL(host);
927 String auth = "Basic " + javax.xml.bind.DatatypeConverter.printBase64Binary(credentials.getBytes());
928 HttpURLConnection connection = (HttpURLConnection) url.openConnection();
929 connection.addRequestProperty("Authorization", auth);
930 connection.setRequestProperty("Connection", "keep-alive");
931 connection.setRequestProperty("Proxy-Connection", "keep-alive");
940 enum SiteConfiguration {
/** Method name handed to {@code HttpURLConnection.setRequestMethod} by the request helpers. */
private final String method;

/**
 * @param method method name this constant stands for
 */
HttpMethod(String method) {
    this.method = method;
}

/**
 * @return the method name given at construction
 */
public String getMethod() {
    return method;
}
960 static final String SITE_IDENTIFIER = "site.identifier";
961 static final String CONTROLLER_USE_SSL = "controller.useSsl";
962 static final String CONTROLLER_PORT_SSL = "controller.port.ssl";
963 static final String CONTROLLER_PORT_HTTP = "controller.port.http";
964 static final String CONTROLLER_PORT_AKKA = "controller.port.akka";
965 static final String CONTROLLER_CREDENTIALS = "controller.credentials";
966 static final String AKKA_CONF_LOCATION = "akka.conf.location";
967 static final String MBEAN_CLUSTER = "mbean.cluster";
968 static final String MBEAN_SHARD_MANAGER = "mbean.shardManager";
969 static final String MBEAN_SHARD_CONFIG = "mbean.shard.config";
970 static final String ADM_USE_SSL = "adm.useSsl";
971 static final String ADM_PORT_SSL = "adm.port.ssl";
972 static final String ADM_PORT_HTTP = "adm.port.http";
973 static final String ADM_FQDN = "adm.fqdn";
974 static final String ADM_HEALTHCHECK= "adm.healthcheck";