/**
* Copyright (C) 2012 LinkedIn Inc <opensource@linkedin.com>
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.linkedin.helix.healthcheck;
import java.util.Date;
import java.util.Map;
import java.util.Set;
import org.testng.Assert;
import org.testng.annotations.AfterClass;
import org.testng.annotations.BeforeClass;
import org.testng.annotations.Test;
import com.linkedin.helix.HelixDataAccessor;
import com.linkedin.helix.HelixManager;
import com.linkedin.helix.NotificationContext;
import com.linkedin.helix.PropertyKey.Builder;
import com.linkedin.helix.TestHelper;
import com.linkedin.helix.TestHelper.StartCMResult;
import com.linkedin.helix.ZNRecord;
import com.linkedin.helix.alerts.AlertValueAndStatus;
import com.linkedin.helix.controller.HelixControllerMain;
import com.linkedin.helix.healthcheck.HealthStatsAggregationTask;
import com.linkedin.helix.healthcheck.ParticipantHealthReportCollectorImpl;
import com.linkedin.helix.integration.ZkIntegrationTestBase;
import com.linkedin.helix.manager.zk.ZKHelixDataAccessor;
import com.linkedin.helix.manager.zk.ZNRecordSerializer;
import com.linkedin.helix.manager.zk.ZkBaseDataAccessor;
import com.linkedin.helix.manager.zk.ZkClient;
import com.linkedin.helix.mock.storage.MockEspressoHealthReportProvider;
import com.linkedin.helix.mock.storage.MockParticipant;
import com.linkedin.helix.mock.storage.MockTransition;
import com.linkedin.helix.model.Message;
import com.linkedin.helix.tools.ClusterSetup;
import com.linkedin.helix.tools.ClusterStateVerifier;
public class TestStalenessAlert extends ZkIntegrationTestBase
{
ZkClient _zkClient;
protected ClusterSetup _setupTool = null;
protected final String _alertStr = "EXP(decay(1)(localhost_*.reportingage))CMP(GREATER)CON(600)";
protected final String _alertStatusStr = _alertStr+" : (localhost_12918.reportingage)";
protected final String _dbName = "TestDB0";
@BeforeClass ()
public void beforeClass() throws Exception
{
_zkClient = new ZkClient(ZK_ADDR);
_zkClient.setZkSerializer(new ZNRecordSerializer());
_setupTool = new ClusterSetup(ZK_ADDR);
}
@AfterClass
public void afterClass()
{
_zkClient.close();
}
public class StalenessAlertTransition extends MockTransition
{
@Override
public void doTransition(Message message, NotificationContext context)
{
HelixManager manager = context.getManager();
HelixDataAccessor accessor = manager.getHelixDataAccessor();
String fromState = message.getFromState();
String toState = message.getToState();
String instance = message.getTgtName();
String partition = message.getPartitionName();
if (fromState.equalsIgnoreCase("SLAVE")
&& toState.equalsIgnoreCase("MASTER"))
{
//add a stat and report to ZK
//perhaps should keep reporter per instance...
ParticipantHealthReportCollectorImpl reporter =
new ParticipantHealthReportCollectorImpl(manager, instance);
MockEspressoHealthReportProvider provider = new
MockEspressoHealthReportProvider();
reporter.addHealthReportProvider(provider);
String statName = "latency";
provider.setStat(_dbName, statName,"15");
reporter.transmitHealthReports();
/*
for (int i = 0; i < 5; i++)
{
accessor.setProperty(PropertyType.HEALTHREPORT,
new ZNRecord("mockAlerts" + i),
instance,
"mockAlerts");
try
{
Thread.sleep(1000);
}
catch (InterruptedException e)
{
// TODO Auto-generated catch block
e.printStackTrace();
}
}
*/
}
}
}
@Test()
public void testStalenessAlert() throws Exception
{
String clusterName = getShortClassName();
MockParticipant[] participants = new MockParticipant[5];
System.out.println("START TestStalenessAlert at " + new Date(System.currentTimeMillis()));
TestHelper.setupCluster(clusterName,
ZK_ADDR,
12918, // participant start port
"localhost", // participant name prefix
"TestDB", // resource name prefix
1, // resources
10, // partitions per resource
5, // number of nodes //change back to 5!!!
3, // replicas //change back to 3!!!
"MasterSlave",
true); // do rebalance
// enableHealthCheck(clusterName);
_setupTool.getClusterManagementTool().addAlert(clusterName, _alertStr);
StartCMResult cmResult = TestHelper.startController(clusterName,
"controller_0",
ZK_ADDR,
HelixControllerMain.STANDALONE);
// start participants
for (int i = 0; i < 5; i++) //!!!change back to 5
{
String instanceName = "localhost_" + (12918 + i);
participants[i] = new MockParticipant(clusterName,
instanceName,
ZK_ADDR,
new StalenessAlertTransition());
participants[i].syncStart();
// new Thread(participants[i]).start();
}
boolean result = ClusterStateVerifier.verifyByPolling(
new ClusterStateVerifier.BestPossAndExtViewZkVerifier(ZK_ADDR, clusterName));
Assert.assertTrue(result);
// HealthAggregationTask is supposed to run by a timer every 30s
// To make sure HealthAggregationTask is run, we invoke it explicitly for this test
new HealthStatsAggregationTask(cmResult._manager).run();
//sleep for a few seconds to give stats stage time to trigger
Thread.sleep(3000);
// other verifications go here
ZKHelixDataAccessor accessor = new ZKHelixDataAccessor(clusterName, new ZkBaseDataAccessor(_zkClient));
Builder keyBuilder = accessor.keyBuilder();
//for (int i = 0; i < 1; i++) //change 1 back to 5
//{
//String instance = "localhost_" + (12918 + i);
//String instance = "localhost_12918";
ZNRecord record = accessor.getProperty(keyBuilder.alertStatus()).getRecord();
Map<String, Map<String,String>> recMap = record.getMapFields();
Set<String> keySet = recMap.keySet();
Map<String,String> alertStatusMap = recMap.get(_alertStatusStr);
String val = alertStatusMap.get(AlertValueAndStatus.VALUE_NAME);
boolean fired = Boolean.parseBoolean(alertStatusMap.get(AlertValueAndStatus.FIRED_NAME));
//Assert.assertEquals(Double.parseDouble(val), Double.parseDouble("75.0"));
// Assert.assertFalse(fired);
//}
System.out.println("END TestStalenessAlert at " + new Date(System.currentTimeMillis()));
}
}