|
20 | 20 |
|
21 | 21 | import io.opentelemetry.api.OpenTelemetry; |
22 | 22 | import io.opentelemetry.api.metrics.BatchCallback; |
| 23 | +import io.opentelemetry.api.metrics.DoubleHistogram; |
| 24 | +import io.opentelemetry.api.metrics.LongHistogram; |
23 | 25 | import io.opentelemetry.api.metrics.ObservableLongMeasurement; |
| 26 | +import java.util.Arrays; |
| 27 | +import java.util.concurrent.TimeUnit; |
24 | 28 | import org.apache.bookkeeper.mledger.ManagedLedger; |
25 | 29 | import org.apache.pulsar.opentelemetry.Constants; |
26 | 30 |
|
27 | 31 | public class OpenTelemetryManagedLedgerStats implements AutoCloseable { |
28 | 32 |
|
| 33 | + // ml-level metrics |
| 34 | + |
29 | 35 | // Replaces pulsar_ml_AddEntryMessagesRate |
30 | 36 | public static final String ADD_ENTRY_COUNTER = "pulsar.broker.managed_ledger.message.outgoing.count"; |
31 | 37 | private final ObservableLongMeasurement addEntryCounter; |
@@ -62,6 +68,29 @@ public class OpenTelemetryManagedLedgerStats implements AutoCloseable { |
62 | 68 |
|
63 | 69 | private final BatchCallback batchCallback; |
64 | 70 |
|
| 71 | + // namespace-level metrics |
| 72 | + |
| 73 | + // Replaces ['pulsar_ml_AddEntryLatencyBuckets', 'pulsar_ml_AddEntryLatencyBuckets_OVERFLOW', |
| 74 | + // 'pulsar_storage_write_latency_*'] |
| 75 | + public static final String ADD_ENTRY_LATENCY_HISTOGRAM = "pulsar.broker.managed_ledger.message.outgoing.latency"; |
| 76 | + private final DoubleHistogram addEntryLatencyHistogram; |
| 77 | + |
| 78 | + // Replaces ['pulsar_ml_LedgerAddEntryLatencyBuckets', 'pulsar_ml_LedgerAddEntryLatencyBuckets_OVERFLOW', |
| 79 | + // 'pulsar_storage_ledger_write_latency_*'] |
| 80 | + public static final String LEDGER_ADD_ENTRY_LATENCY_HISTOGRAM = |
| 81 | + "pulsar.broker.managed_ledger.message.outgoing.ledger.latency"; |
| 82 | + private final DoubleHistogram ledgerAddEntryLatencyHistogram; |
| 83 | + |
| 84 | + // Replaces ['pulsar_ml_LedgerSwitchLatencyBuckets', 'pulsar_ml_LedgerSwitchLatencyBuckets_OVERFLOW'] |
| 85 | + public static final String LEDGER_SWITCH_LATENCY_HISTOGRAM = |
| 86 | + "pulsar.broker.managed_ledger.ledger.switch.latency"; |
| 87 | + private final DoubleHistogram ledgerSwitchLatencyHistogram; |
| 88 | + |
| 89 | + // Replaces ['pulsar_ml_EntrySizeBuckets', 'pulsar_ml_EntrySizeBuckets_OVERFLOW', |
| 90 | + // 'pulsar_entry_size_*'] |
| 91 | + public static final String ENTRY_SIZE_HISTOGRAM = "pulsar.broker.managed_ledger.entry.size"; |
| 92 | + private final LongHistogram entrySizeHistogram; |
| 93 | + |
65 | 94 | public OpenTelemetryManagedLedgerStats(OpenTelemetry openTelemetry, ManagedLedgerFactoryImpl factory) { |
66 | 95 | var meter = openTelemetry.getMeter(Constants.BROKER_INSTRUMENTATION_SCOPE_NAME); |
67 | 96 |
|
@@ -124,6 +153,39 @@ public OpenTelemetryManagedLedgerStats(OpenTelemetry openTelemetry, ManagedLedge |
124 | 153 | bytesInCounter, |
125 | 154 | readEntryCacheMissCounter, |
126 | 155 | markDeleteCounter); |
| 156 | + |
| 157 | + addEntryLatencyHistogram = meter |
| 158 | + .histogramBuilder(ADD_ENTRY_LATENCY_HISTOGRAM) |
| 159 | + .setDescription("End-to-end write latency, including time spent in the executor queue.") |
| 160 | + .setUnit("s") |
| 161 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(0.001, 0.005, 0.01, 0.02, 0.05, 0.1, |
| 162 | + 0.2, 0.5, 1.0, 5.0, 30.0)) |
| 163 | + .build(); |
| 164 | + |
| 165 | + ledgerAddEntryLatencyHistogram = meter |
| 166 | + .histogramBuilder(LEDGER_ADD_ENTRY_LATENCY_HISTOGRAM) |
| 167 | + .setDescription("End-to end write latency.") |
| 168 | + .setUnit("s") |
| 169 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(0.001, 0.005, 0.01, 0.02, 0.05, 0.1, |
| 170 | + 0.2, 0.5, 1.0, 5.0, 30.0)) |
| 171 | + .build(); |
| 172 | + |
| 173 | + ledgerSwitchLatencyHistogram = meter |
| 174 | + .histogramBuilder(LEDGER_SWITCH_LATENCY_HISTOGRAM) |
| 175 | + .setDescription("Time taken to switch to a new ledger.") |
| 176 | + .setUnit("s") |
| 177 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(0.001, 0.005, 0.01, 0.02, 0.05, 0.1, |
| 178 | + 0.2, 0.5, 1.0, 5.0, 30.0)) |
| 179 | + .build(); |
| 180 | + |
| 181 | + entrySizeHistogram = meter |
| 182 | + .histogramBuilder(ENTRY_SIZE_HISTOGRAM) |
| 183 | + .ofLongs() |
| 184 | + .setDescription("Size of entries written to the ledger.") |
| 185 | + .setUnit("By") |
| 186 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(128L, 512L, 1024L, 2048L, 4096L, 16_384L, |
| 187 | + 102_400L, 1_048_576L)) |
| 188 | + .build(); |
127 | 189 | } |
128 | 190 |
|
129 | 191 | @Override |
@@ -151,4 +213,24 @@ private void recordMetrics(ManagedLedger ml) { |
151 | 213 | markDeleteCounter.record(stats.getMarkDeleteTotal(), attributes); |
152 | 214 | readEntryCacheMissCounter.record(stats.getReadEntriesOpsCacheMissesTotal(), attributes); |
153 | 215 | } |
| 216 | + |
| 217 | + void recordAddEntryLatency(long latency, TimeUnit unit, ManagedLedger ml) { |
| 218 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 219 | + this.addEntryLatencyHistogram.record(unit.toMillis(latency) / 1000.0, attributes); |
| 220 | + } |
| 221 | + |
| 222 | + void recordLedgerAddEntryLatency(long latency, TimeUnit unit, ManagedLedger ml) { |
| 223 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 224 | + this.ledgerAddEntryLatencyHistogram.record(unit.toMillis(latency) / 1000.0, attributes); |
| 225 | + } |
| 226 | + |
| 227 | + void recordLedgerSwitchLatency(long latency, TimeUnit unit, ManagedLedger ml) { |
| 228 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 229 | + this.ledgerSwitchLatencyHistogram.record(unit.toMillis(latency) / 1000.0, attributes); |
| 230 | + } |
| 231 | + |
| 232 | + void recordEntrySize(long entrySize, ManagedLedger ml) { |
| 233 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 234 | + this.entrySizeHistogram.record(entrySize, attributes); |
| 235 | + } |
154 | 236 | } |
0 commit comments