use of org.apache.hadoop.hive.ql.exec.repl.ReplStatsTracker in project hive by apache.
the class TestReplicationMetricSink method testSuccessBootstrapDumpMetrics.
@Test
public void testSuccessBootstrapDumpMetrics() throws Exception {
ReplicationMetricCollector bootstrapDumpMetricCollector = new BootstrapDumpMetricCollector("testAcidTablesReplLoadBootstrapIncr_1592205875387", "hdfs://localhost:65158/tmp/org_apache_hadoop_hive_ql_parse_TestReplicationScenarios_245261428230295" + "/hrepl0/dGVzdGFjaWR0YWJsZXNyZXBsbG9hZGJvb3RzdHJhcGluY3JfMTU5MjIwNTg3NTM4Nw==/0/hive", conf);
Map<String, Long> metricMap = new HashMap<>();
metricMap.put(ReplUtils.MetricName.TABLES.name(), (long) 10);
metricMap.put(ReplUtils.MetricName.FUNCTIONS.name(), (long) 1);
bootstrapDumpMetricCollector.reportStageStart("dump", metricMap);
bootstrapDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.TABLES.name(), 1);
bootstrapDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.TABLES.name(), 2);
bootstrapDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.FUNCTIONS.name(), 1);
bootstrapDumpMetricCollector.reportStageEnd("dump", Status.SUCCESS, 10, new SnapshotUtils.ReplSnapshotCount(), new ReplStatsTracker(0));
bootstrapDumpMetricCollector.reportEnd(Status.SUCCESS);
Metadata expectedMetadata = new Metadata("testAcidTablesReplLoadBootstrapIncr_1592205875387", Metadata.ReplicationType.BOOTSTRAP, "dummyDir");
expectedMetadata.setLastReplId(10);
Progress expectedProgress = new Progress();
expectedProgress.setStatus(Status.SUCCESS);
Stage dumpStage = new Stage("dump", Status.SUCCESS, 0);
dumpStage.setEndTime(0);
Metric expectedTableMetric = new Metric(ReplUtils.MetricName.TABLES.name(), 10);
expectedTableMetric.setCurrentCount(3);
Metric expectedFuncMetric = new Metric(ReplUtils.MetricName.FUNCTIONS.name(), 1);
expectedFuncMetric.setCurrentCount(1);
dumpStage.addMetric(expectedTableMetric);
dumpStage.addMetric(expectedFuncMetric);
expectedProgress.addStage(dumpStage);
ReplicationMetric expectedMetric = new ReplicationMetric(1, "repl", 0, expectedMetadata);
expectedMetric.setProgress(expectedProgress);
Thread.sleep(1000 * 20);
GetReplicationMetricsRequest metricsRequest = new GetReplicationMetricsRequest();
metricsRequest.setPolicy("repl");
ReplicationMetricList actualReplicationMetrics = Hive.get(conf).getMSC().getReplicationMetrics(metricsRequest);
ReplicationMetrics actualThriftMetric = actualReplicationMetrics.getReplicationMetricList().get(0);
ObjectMapper mapper = new ObjectMapper();
ReplicationMetric actualMetric = new ReplicationMetric(actualThriftMetric.getScheduledExecutionId(), actualThriftMetric.getPolicy(), actualThriftMetric.getDumpExecutionId(), mapper.readValue(actualThriftMetric.getMetadata(), Metadata.class));
actualMetric.setMessageFormat(actualThriftMetric.getMessageFormat());
ProgressMapper progressMapper = mapper.readValue(deSerialize(actualThriftMetric.getProgress()), ProgressMapper.class);
Progress progress = new Progress();
progress.setStatus(progressMapper.getStatus());
for (StageMapper stageMapper : progressMapper.getStages()) {
Stage stage = new Stage();
stage.setName(stageMapper.getName());
stage.setStatus(stageMapper.getStatus());
stage.setStartTime(stageMapper.getStartTime());
stage.setEndTime(stageMapper.getEndTime());
for (Metric metric : stageMapper.getMetrics()) {
stage.addMetric(metric);
}
progress.addStage(stage);
}
actualMetric.setProgress(progress);
checkSuccess(actualMetric, expectedMetric, "dump", Arrays.asList(ReplUtils.MetricName.TABLES.name(), ReplUtils.MetricName.FUNCTIONS.name()));
// Incremental
conf.set(Constants.SCHEDULED_QUERY_EXECUTIONID, "2");
ReplicationMetricCollector incrementDumpMetricCollector = new IncrementalDumpMetricCollector("testAcidTablesReplLoadBootstrapIncr_1592205875387", "hdfs://localhost:65158/tmp/org_apache_hadoop_hive_ql_parse_TestReplicationScenarios_245261428230295" + "/hrepl0/dGVzdGFjaWR0YWJsZXNyZXBsbG9hZGJvb3RzdHJhcGluY3JfMTU5MjIwNTg3NTM4Nw==/0/hive", conf);
metricMap = new HashMap<>();
metricMap.put(ReplUtils.MetricName.EVENTS.name(), (long) 10);
incrementDumpMetricCollector.reportStageStart("dump", metricMap);
incrementDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.EVENTS.name(), 10);
incrementDumpMetricCollector.reportStageEnd("dump", Status.SUCCESS, 10, new SnapshotUtils.ReplSnapshotCount(), new ReplStatsTracker(0));
incrementDumpMetricCollector.reportEnd(Status.SUCCESS);
expectedMetadata = new Metadata("testAcidTablesReplLoadBootstrapIncr_1592205875387", Metadata.ReplicationType.INCREMENTAL, "dummyDir");
expectedMetadata.setLastReplId(10);
expectedProgress = new Progress();
expectedProgress.setStatus(Status.SUCCESS);
dumpStage = new Stage("dump", Status.SUCCESS, 0);
dumpStage.setEndTime(0);
Metric expectedEventsMetric = new Metric(ReplUtils.MetricName.EVENTS.name(), 10);
expectedEventsMetric.setCurrentCount(10);
dumpStage.addMetric(expectedEventsMetric);
expectedProgress.addStage(dumpStage);
expectedMetric = new ReplicationMetric(2, "repl", 0, expectedMetadata);
expectedMetric.setProgress(expectedProgress);
Thread.sleep(1000 * 20);
metricsRequest = new GetReplicationMetricsRequest();
metricsRequest.setPolicy("repl");
actualReplicationMetrics = Hive.get(conf).getMSC().getReplicationMetrics(metricsRequest);
Assert.assertEquals(2, actualReplicationMetrics.getReplicationMetricListSize());
actualThriftMetric = actualReplicationMetrics.getReplicationMetricList().get(0);
mapper = new ObjectMapper();
actualMetric = new ReplicationMetric(actualThriftMetric.getScheduledExecutionId(), actualThriftMetric.getPolicy(), actualThriftMetric.getDumpExecutionId(), mapper.readValue(actualThriftMetric.getMetadata(), Metadata.class));
actualMetric.setMessageFormat(actualThriftMetric.getMessageFormat());
progressMapper = mapper.readValue(deSerialize(actualThriftMetric.getProgress()), ProgressMapper.class);
progress = new Progress();
progress.setStatus(progressMapper.getStatus());
for (StageMapper stageMapper : progressMapper.getStages()) {
Stage stage = new Stage();
stage.setName(stageMapper.getName());
stage.setStatus(stageMapper.getStatus());
stage.setStartTime(stageMapper.getStartTime());
stage.setEndTime(stageMapper.getEndTime());
for (Metric metric : stageMapper.getMetrics()) {
stage.addMetric(metric);
}
progress.addStage(stage);
}
actualMetric.setProgress(progress);
checkSuccessIncremental(actualMetric, expectedMetric, "dump", Arrays.asList(ReplUtils.MetricName.EVENTS.name()));
// Failover Metrics Sink
Mockito.when(fmd.getFailoverEventId()).thenReturn(100L);
Mockito.when(fmd.getFilePath()).thenReturn("hdfs://localhost:65158/tmp/org_apache_hadoop_hive_ql_parse_TestReplicationScenarios_245261428230295" + "/hrepl0/dGVzdGFjaWR0YWJsZXNyZXBsbG9hZGJvb3RzdHJhcGluY3JfMTU5MjIwNTg3NTM4Nw==/0/hive/");
conf.set(Constants.SCHEDULED_QUERY_EXECUTIONID, "3");
String stagingDir = "hdfs://localhost:65158/tmp/org_apache_hadoop_hive_ql_parse_TestReplicationScenarios_245261428230295" + "/hrepl0/dGVzdGFjaWR0YWJsZXNyZXBsbG9hZGJvb3RzdHJhcGluY3JfMTU5MjIwNTg3NTM4Nw==/0/hive/";
ReplicationMetricCollector failoverDumpMetricCollector = new IncrementalDumpMetricCollector("testAcidTablesReplLoadBootstrapIncr_1592205875387", stagingDir, conf);
metricMap = new HashMap<String, Long>() {
{
put(ReplUtils.MetricName.EVENTS.name(), (long) 10);
}
};
failoverDumpMetricCollector.reportFailoverStart("dump", metricMap, fmd);
failoverDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.EVENTS.name(), 10);
failoverDumpMetricCollector.reportStageEnd("dump", Status.SUCCESS, 10, new SnapshotUtils.ReplSnapshotCount(), new ReplStatsTracker(0));
failoverDumpMetricCollector.reportEnd(Status.FAILOVER_READY);
expectedMetadata = new Metadata("testAcidTablesReplLoadBootstrapIncr_1592205875387", Metadata.ReplicationType.INCREMENTAL, "dummyDir");
expectedMetadata.setLastReplId(10);
expectedMetadata.setFailoverEventId(100);
expectedMetadata.setFailoverMetadataLoc(stagingDir + FailoverMetaData.FAILOVER_METADATA);
expectedProgress = new Progress();
expectedProgress.setStatus(Status.FAILOVER_READY);
dumpStage = new Stage("dump", Status.SUCCESS, 0);
dumpStage.setEndTime(0);
expectedEventsMetric = new Metric(ReplUtils.MetricName.EVENTS.name(), 10);
expectedEventsMetric.setCurrentCount(10);
dumpStage.addMetric(expectedEventsMetric);
expectedProgress.addStage(dumpStage);
expectedMetric = new ReplicationMetric(3, "repl", 0, expectedMetadata);
expectedMetric.setProgress(expectedProgress);
Thread.sleep(1000 * 20);
metricsRequest = new GetReplicationMetricsRequest();
metricsRequest.setPolicy("repl");
actualReplicationMetrics = Hive.get(conf).getMSC().getReplicationMetrics(metricsRequest);
Assert.assertEquals(3, actualReplicationMetrics.getReplicationMetricListSize());
actualThriftMetric = actualReplicationMetrics.getReplicationMetricList().get(0);
mapper = new ObjectMapper();
actualMetric = new ReplicationMetric(actualThriftMetric.getScheduledExecutionId(), actualThriftMetric.getPolicy(), actualThriftMetric.getDumpExecutionId(), mapper.readValue(actualThriftMetric.getMetadata(), Metadata.class));
actualMetric.setMessageFormat(actualThriftMetric.getMessageFormat());
progressMapper = mapper.readValue(deSerialize(actualThriftMetric.getProgress()), ProgressMapper.class);
progress = new Progress();
progress.setStatus(progressMapper.getStatus());
for (StageMapper stageMapper : progressMapper.getStages()) {
Stage stage = new Stage();
stage.setName(stageMapper.getName());
stage.setStatus(stageMapper.getStatus());
stage.setStartTime(stageMapper.getStartTime());
stage.setEndTime(stageMapper.getEndTime());
for (Metric metric : stageMapper.getMetrics()) {
stage.addMetric(metric);
}
progress.addStage(stage);
}
actualMetric.setProgress(progress);
checkSuccessIncremental(actualMetric, expectedMetric, "dump", Arrays.asList(ReplUtils.MetricName.EVENTS.name()));
}
use of org.apache.hadoop.hive.ql.exec.repl.ReplStatsTracker in project hive by apache.
the class TestReplicationMetricSink method testReplStatsInMetrics.
@Test
public void testReplStatsInMetrics() throws HiveException, InterruptedException, TException {
int origRMProgress = ReplStatsTracker.RM_PROGRESS_LENGTH;
ReplStatsTracker.RM_PROGRESS_LENGTH = 10;
ReplicationMetricCollector incrementDumpMetricCollector = new IncrementalDumpMetricCollector("testAcidTablesReplLoadBootstrapIncr_1592205875387", "hdfs://localhost:65158/tmp/org_apache_hadoop_hive_ql_parse_TestReplicationScenarios_245261428230295" + "/hrepl0/dGVzdGFjaWR0YWJsZXNyZXBsbG9hZGJvb3RzdHJhcGluY3JfMTU5MjIwNTg3NTM4Nw==/0/hive", conf);
Map<String, Long> metricMap = new HashMap<>();
ReplStatsTracker repl = Mockito.mock(ReplStatsTracker.class);
Mockito.when(repl.toString()).thenReturn(RandomStringUtils.randomAlphabetic(1000));
metricMap.put(ReplUtils.MetricName.EVENTS.name(), (long) 10);
incrementDumpMetricCollector.reportStageStart("dump", metricMap);
incrementDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.EVENTS.name(), 10);
incrementDumpMetricCollector.reportStageEnd("dump", Status.SUCCESS, 10, new SnapshotUtils.ReplSnapshotCount(), repl);
Thread.sleep(1000 * 20);
GetReplicationMetricsRequest metricsRequest = new GetReplicationMetricsRequest();
metricsRequest.setPolicy("repl");
ReplicationMetricList actualReplicationMetrics = Hive.get(conf).getMSC().getReplicationMetrics(metricsRequest);
String progress = deSerialize(actualReplicationMetrics.getReplicationMetricList().get(0).getProgress());
assertTrue(progress, progress.contains("ERROR: RM_PROGRESS LIMIT EXCEEDED."));
ReplStatsTracker.RM_PROGRESS_LENGTH = origRMProgress;
// Testing K_MAX
repl = new ReplStatsTracker(15);
Assert.assertEquals(ReplStatsTracker.TOP_K_MAX, repl.getK());
}
use of org.apache.hadoop.hive.ql.exec.repl.ReplStatsTracker in project hive by apache.
the class TestReplicationMetricCollector method testSuccessIncrDumpMetrics.
@Test
public void testSuccessIncrDumpMetrics() throws Exception {
ReplicationMetricCollector incrDumpMetricCollector = new IncrementalDumpMetricCollector("db", "dummyDir", conf);
Map<String, Long> metricMap = new HashMap<>();
metricMap.put(ReplUtils.MetricName.TABLES.name(), (long) 10);
metricMap.put(ReplUtils.MetricName.FUNCTIONS.name(), (long) 1);
incrDumpMetricCollector.reportStageStart("dump", metricMap);
incrDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.TABLES.name(), 1);
List<ReplicationMetric> actualMetrics = MetricCollector.getInstance().getMetrics();
Assert.assertEquals(1, actualMetrics.size());
incrDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.TABLES.name(), 2);
incrDumpMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.FUNCTIONS.name(), 1);
actualMetrics = MetricCollector.getInstance().getMetrics();
Assert.assertEquals(1, actualMetrics.size());
incrDumpMetricCollector.reportStageEnd("dump", Status.SUCCESS, 10, new SnapshotUtils.ReplSnapshotCount(), new ReplStatsTracker(0));
incrDumpMetricCollector.reportEnd(Status.SUCCESS);
actualMetrics = MetricCollector.getInstance().getMetrics();
Assert.assertEquals(1, actualMetrics.size());
Metadata expectedMetadata = new Metadata("db", Metadata.ReplicationType.INCREMENTAL, "dummyDir");
expectedMetadata.setLastReplId(10);
Progress expectedProgress = new Progress();
expectedProgress.setStatus(Status.SUCCESS);
Stage dumpStage = new Stage("dump", Status.SUCCESS, 0);
dumpStage.setEndTime(0);
Metric expectedTableMetric = new Metric(ReplUtils.MetricName.TABLES.name(), 10);
expectedTableMetric.setCurrentCount(3);
Metric expectedFuncMetric = new Metric(ReplUtils.MetricName.FUNCTIONS.name(), 1);
expectedFuncMetric.setCurrentCount(1);
dumpStage.addMetric(expectedTableMetric);
dumpStage.addMetric(expectedFuncMetric);
expectedProgress.addStage(dumpStage);
ReplicationMetric expectedMetric = new ReplicationMetric(1, "repl", 0, expectedMetadata);
expectedMetric.setProgress(expectedProgress);
checkSuccess(actualMetrics.get(0), expectedMetric, "dump", Arrays.asList(ReplUtils.MetricName.TABLES.name(), ReplUtils.MetricName.FUNCTIONS.name()));
}
use of org.apache.hadoop.hive.ql.exec.repl.ReplStatsTracker in project hive by apache.
the class TestReplicationMetricCollector method testReplStatsTrackerLimit.
@Test
public void testReplStatsTrackerLimit() {
MessageSerializer serializer = MessageFactory.getDefaultInstanceForReplMetrics(conf).getSerializer();
ReplStatsTracker repl = new ReplStatsTracker(10);
// Check for k=10
generateStatsString(10, repl);
String replStatsTracker = repl.toString();
String gzipSerialized = serializer.serialize(replStatsTracker);
assertTrue("ReplStat string is " + gzipSerialized.length(), gzipSerialized.length() < ReplStatsTracker.RM_PROGRESS_LENGTH);
// Check for k=5
repl = new ReplStatsTracker(5);
generateStatsString(5, repl);
replStatsTracker = repl.toString();
gzipSerialized = serializer.serialize(replStatsTracker);
assertTrue("ReplStat string is " + gzipSerialized.length(), gzipSerialized.length() < ReplStatsTracker.RM_PROGRESS_LENGTH);
// Check for k=2 & check NaN values doesn't get messed up due to formatter
repl = new ReplStatsTracker(2);
generateStatsString(2, repl);
assertTrue(repl.toString().contains("NaN"));
}
use of org.apache.hadoop.hive.ql.exec.repl.ReplStatsTracker in project hive by apache.
the class TestReplicationMetricCollector method testSuccessBootstrapLoadMetrics.
@Test
public void testSuccessBootstrapLoadMetrics() throws Exception {
ReplicationMetricCollector bootstrapLoadMetricCollector = new BootstrapLoadMetricCollector("db", "dummyDir", 1, conf);
Map<String, Long> metricMap = new HashMap<>();
metricMap.put(ReplUtils.MetricName.TABLES.name(), (long) 10);
metricMap.put(ReplUtils.MetricName.FUNCTIONS.name(), (long) 1);
bootstrapLoadMetricCollector.reportStageStart("dump", metricMap);
bootstrapLoadMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.TABLES.name(), 1);
List<ReplicationMetric> actualMetrics = MetricCollector.getInstance().getMetrics();
Assert.assertEquals(1, actualMetrics.size());
bootstrapLoadMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.TABLES.name(), 2);
bootstrapLoadMetricCollector.reportStageProgress("dump", ReplUtils.MetricName.FUNCTIONS.name(), 1);
actualMetrics = MetricCollector.getInstance().getMetrics();
Assert.assertEquals(1, actualMetrics.size());
bootstrapLoadMetricCollector.reportStageEnd("dump", Status.SUCCESS, 10, new SnapshotUtils.ReplSnapshotCount(), new ReplStatsTracker(0));
bootstrapLoadMetricCollector.reportEnd(Status.SUCCESS);
actualMetrics = MetricCollector.getInstance().getMetrics();
Assert.assertEquals(1, actualMetrics.size());
Metadata expectedMetadata = new Metadata("db", Metadata.ReplicationType.BOOTSTRAP, "dummyDir");
expectedMetadata.setLastReplId(10);
Progress expectedProgress = new Progress();
expectedProgress.setStatus(Status.SUCCESS);
Stage dumpStage = new Stage("dump", Status.SUCCESS, 0);
dumpStage.setEndTime(0);
Metric expectedTableMetric = new Metric(ReplUtils.MetricName.TABLES.name(), 10);
expectedTableMetric.setCurrentCount(3);
Metric expectedFuncMetric = new Metric(ReplUtils.MetricName.FUNCTIONS.name(), 1);
expectedFuncMetric.setCurrentCount(1);
dumpStage.addMetric(expectedTableMetric);
dumpStage.addMetric(expectedFuncMetric);
expectedProgress.addStage(dumpStage);
ReplicationMetric expectedMetric = new ReplicationMetric(1, "repl", 1, expectedMetadata);
expectedMetric.setProgress(expectedProgress);
checkSuccess(actualMetrics.get(0), expectedMetric, "dump", Arrays.asList(ReplUtils.MetricName.TABLES.name(), ReplUtils.MetricName.FUNCTIONS.name()));
}
Aggregations