report message gap, source gap and sink count in RealtimePlumber (#3744)

* report message gap, source gap and sink count in RealtimePlumber

* report message gap, sink count in Appenderator

* add ingest/events/sourceGap in metrics.md

* remove source gap
This commit is contained in:
kaijianding 2016-12-14 01:23:02 +08:00 committed by Himanshu
parent 07384d6f40
commit 4be3eb0ce7
5 changed files with 43 additions and 1 deletions

View File

@ -109,6 +109,8 @@ These metrics are only available if the RealtimeMetricsMonitor is included in th
|`ingest/merge/time`|Milliseconds spent merging intermediate segments|dataSource.|Depends on configuration. Generally a few minutes at most.|
|`ingest/merge/cpu`|Cpu time in Nanoseconds spent on merging intermediate segments.|dataSource.|Depends on configuration. Generally a few minutes at most.|
|`ingest/handoff/count`|Number of handoffs that happened.|dataSource.|Varies. Generally greater than 0 once every segment granular period if cluster operating normally|
|`ingest/sink/count`|Number of sinks not handoffed.|dataSource.|1~3|
|`ingest/events/messageGap`|Time gap between the data time in event and current system time.|dataSource.|Greater than 0, depends on the time carried in event |
Note: If the JVM does not support CPU time measurement for the current thread, ingest/merge/cpu and ingest/persists/cpu will be 0.

View File

@ -40,6 +40,9 @@ public class FireDepartmentMetrics
private final AtomicLong mergeCpuTime = new AtomicLong(0);
private final AtomicLong persistCpuTime = new AtomicLong(0);
private final AtomicLong handOffCount = new AtomicLong(0);
private final AtomicLong sinkCount = new AtomicLong(0);
private final AtomicLong messageMaxTimestamp = new AtomicLong(0);
private final AtomicLong messageGap = new AtomicLong(0);
public void incrementProcessed()
{
@ -103,6 +106,14 @@ public class FireDepartmentMetrics
handOffCount.incrementAndGet();
}
public void setSinkCount(long sinkCount){
this.sinkCount.set(sinkCount);
}
public void reportMessageMaxTimestamp(long messageMaxTimestamp){
this.messageMaxTimestamp.set(Math.max(messageMaxTimestamp, this.messageMaxTimestamp.get()));
}
public long processed()
{
return processedCount.get();
@ -168,6 +179,20 @@ public class FireDepartmentMetrics
return handOffCount.get();
}
public long sinkCount()
{
return sinkCount.get();
}
public long messageMaxTimestamp()
{
return messageMaxTimestamp.get();
}
public long messageGap()
{
return messageGap.get();
}
public FireDepartmentMetrics snapshot()
{
@ -185,6 +210,9 @@ public class FireDepartmentMetrics
retVal.mergeCpuTime.set(mergeCpuTime.get());
retVal.persistCpuTime.set(persistCpuTime.get());
retVal.handOffCount.set(handOffCount.get());
retVal.sinkCount.set(sinkCount.get());
retVal.messageMaxTimestamp.set(messageMaxTimestamp.get());
retVal.messageGap.set(System.currentTimeMillis() - messageMaxTimestamp.get());
return retVal;
}
@ -210,6 +238,9 @@ public class FireDepartmentMetrics
mergeCpuTime.addAndGet(otherSnapshot.mergeCpuTime());
persistCpuTime.addAndGet(otherSnapshot.persistCpuTime());
handOffCount.addAndGet(otherSnapshot.handOffCount());
sinkCount.addAndGet(otherSnapshot.sinkCount());
messageMaxTimestamp.set(Math.max(messageMaxTimestamp(), otherSnapshot.messageMaxTimestamp()));
messageGap.set(Math.max(messageGap(), otherSnapshot.messageGap()));
return this;
}

View File

@ -96,6 +96,8 @@ public class RealtimeMetricsMonitor extends AbstractMonitor
emitter.emit(builder.build("ingest/merge/time", metrics.mergeTimeMillis() - previous.mergeTimeMillis()));
emitter.emit(builder.build("ingest/merge/cpu", metrics.mergeCpuTime() - previous.mergeCpuTime()));
emitter.emit(builder.build("ingest/handoff/count", metrics.handOffCount() - previous.handOffCount()));
emitter.emit(builder.build("ingest/sink/count", metrics.sinkCount()));
emitter.emit(builder.build("ingest/events/messageGap", metrics.messageGap()));
previousValues.put(fireDepartment, metrics);
}

View File

@ -191,6 +191,7 @@ public class AppenderatorImpl implements Appenderator
}
final Sink sink = getOrCreateSink(identifier);
metrics.reportMessageMaxTimestamp(row.getTimestampFromEpoch());
final int sinkRowsInMemoryBeforeAdd = sink.getNumRowsInMemory();
final int sinkRowsInMemoryAfterAdd;
@ -269,6 +270,7 @@ public class AppenderatorImpl implements Appenderator
}
sinks.put(identifier, retVal);
metrics.setSinkCount(sinks.size());
sinkTimeline.add(retVal.getInterval(), retVal.getVersion(), identifier.getShardSpec().createChunk(retVal));
}
@ -905,6 +907,7 @@ public class AppenderatorImpl implements Appenderator
log.info("Removing sink for segment[%s].", identifier);
sinks.remove(identifier);
metrics.setSinkCount(sinks.size());
droppingSinks.remove(identifier);
sinkTimeline.remove(
sink.getInterval(),

View File

@ -204,7 +204,9 @@ public class RealtimePlumber implements Plumber
@Override
public int add(InputRow row, Supplier<Committer> committerSupplier) throws IndexSizeExceededException
{
final Sink sink = getSink(row.getTimestampFromEpoch());
long messageTimestamp = row.getTimestampFromEpoch();
final Sink sink = getSink(messageTimestamp);
metrics.reportMessageMaxTimestamp(messageTimestamp);
if (sink == null) {
return -1;
}
@ -716,6 +718,7 @@ public class RealtimePlumber implements Plumber
private void addSink(final Sink sink)
{
sinks.put(sink.getInterval().getStartMillis(), sink);
metrics.setSinkCount(sinks.size());
sinkTimeline.add(
sink.getInterval(),
sink.getVersion(),
@ -850,6 +853,7 @@ public class RealtimePlumber implements Plumber
removeSegment(sink, computePersistDir(schema, sink.getInterval()));
log.info("Removing sinkKey %d for segment %s", truncatedTime, sink.getSegment().getIdentifier());
sinks.remove(truncatedTime);
metrics.setSinkCount(sinks.size());
sinkTimeline.remove(
sink.getInterval(),
sink.getVersion(),