|
20 | 20 |
|
21 | 21 | import io.opentelemetry.api.OpenTelemetry; |
22 | 22 | import io.opentelemetry.api.metrics.BatchCallback; |
| 23 | +import io.opentelemetry.api.metrics.DoubleHistogram; |
| 24 | +import io.opentelemetry.api.metrics.LongHistogram; |
23 | 25 | import io.opentelemetry.api.metrics.ObservableLongMeasurement; |
| 26 | +import java.util.Arrays; |
| 27 | +import java.util.concurrent.TimeUnit; |
24 | 28 | import org.apache.bookkeeper.mledger.ManagedLedger; |
25 | 29 | import org.apache.pulsar.opentelemetry.Constants; |
26 | 30 |
|
27 | 31 | public class OpenTelemetryManagedLedgerStats implements AutoCloseable { |
28 | 32 |
|
| 33 | + // ml-level metrics |
| 34 | + |
29 | 35 | // Replaces pulsar_ml_AddEntryMessagesRate |
30 | 36 | public static final String ADD_ENTRY_COUNTER = "pulsar.broker.managed_ledger.message.outgoing.count"; |
31 | 37 | private final ObservableLongMeasurement addEntryCounter; |
@@ -62,6 +68,34 @@ public class OpenTelemetryManagedLedgerStats implements AutoCloseable { |
62 | 68 |
|
63 | 69 | private final BatchCallback batchCallback; |
64 | 70 |
|
| 71 | + // namespace-level metrics |
| 72 | + |
| 73 | + // Histograms support only synchronous mode, so record measurements directly. |
| 74 | + // Synchronous histograms currently do not support delete operations. |
| 75 | + // Therefore, use only namespace-level attributes to avoid leaking high-cardinality attributes (e.g. topic name). |
| 76 | + // See: https://github.com/apache/pulsar/blob/master/pip/pip-264.md |
| 77 | + |
| 78 | + // Replaces ['pulsar_ml_AddEntryLatencyBuckets', 'pulsar_ml_AddEntryLatencyBuckets_OVERFLOW', |
| 79 | + // 'pulsar_storage_write_latency_*'] |
| 80 | + public static final String ADD_ENTRY_LATENCY_HISTOGRAM = "pulsar.broker.managed_ledger.message.outgoing.latency"; |
| 81 | + private final DoubleHistogram addEntryLatencyHistogram; |
| 82 | + |
| 83 | + // Replaces ['pulsar_ml_LedgerAddEntryLatencyBuckets', 'pulsar_ml_LedgerAddEntryLatencyBuckets_OVERFLOW', |
| 84 | + // 'pulsar_storage_ledger_write_latency_*'] |
| 85 | + public static final String LEDGER_ADD_ENTRY_LATENCY_HISTOGRAM = |
| 86 | + "pulsar.broker.managed_ledger.message.outgoing.ledger.latency"; |
| 87 | + private final DoubleHistogram ledgerAddEntryLatencyHistogram; |
| 88 | + |
| 89 | + // Replaces ['pulsar_ml_LedgerSwitchLatencyBuckets', 'pulsar_ml_LedgerSwitchLatencyBuckets_OVERFLOW'] |
| 90 | + public static final String LEDGER_SWITCH_LATENCY_HISTOGRAM = |
| 91 | + "pulsar.broker.managed_ledger.ledger.switch.latency"; |
| 92 | + private final DoubleHistogram ledgerSwitchLatencyHistogram; |
| 93 | + |
| 94 | + // Replaces ['pulsar_ml_EntrySizeBuckets', 'pulsar_ml_EntrySizeBuckets_OVERFLOW', |
| 95 | + // 'pulsar_entry_size_*'] |
| 96 | + public static final String ENTRY_SIZE_HISTOGRAM = "pulsar.broker.managed_ledger.entry.size"; |
| 97 | + private final LongHistogram entrySizeHistogram; |
| 98 | + |
65 | 99 | public OpenTelemetryManagedLedgerStats(OpenTelemetry openTelemetry, ManagedLedgerFactoryImpl factory) { |
66 | 100 | var meter = openTelemetry.getMeter(Constants.BROKER_INSTRUMENTATION_SCOPE_NAME); |
67 | 101 |
|
@@ -124,6 +158,39 @@ public OpenTelemetryManagedLedgerStats(OpenTelemetry openTelemetry, ManagedLedge |
124 | 158 | bytesInCounter, |
125 | 159 | readEntryCacheMissCounter, |
126 | 160 | markDeleteCounter); |
| 161 | + |
| 162 | + addEntryLatencyHistogram = meter |
| 163 | + .histogramBuilder(ADD_ENTRY_LATENCY_HISTOGRAM) |
| 164 | + .setDescription("End-to-end write latency, including time spent in the executor queue.") |
| 165 | + .setUnit("s") |
| 166 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(0.001, 0.005, 0.01, 0.02, 0.05, 0.1, |
| 167 | + 0.2, 0.5, 1.0, 5.0, 30.0)) |
| 168 | + .build(); |
| 169 | + |
| 170 | + ledgerAddEntryLatencyHistogram = meter |
| 171 | + .histogramBuilder(LEDGER_ADD_ENTRY_LATENCY_HISTOGRAM) |
| 172 | + .setDescription("End-to end write latency.") |
| 173 | + .setUnit("s") |
| 174 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(0.001, 0.005, 0.01, 0.02, 0.05, 0.1, |
| 175 | + 0.2, 0.5, 1.0, 5.0, 30.0)) |
| 176 | + .build(); |
| 177 | + |
| 178 | + ledgerSwitchLatencyHistogram = meter |
| 179 | + .histogramBuilder(LEDGER_SWITCH_LATENCY_HISTOGRAM) |
| 180 | + .setDescription("Time taken to switch to a new ledger.") |
| 181 | + .setUnit("s") |
| 182 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(0.001, 0.005, 0.01, 0.02, 0.05, 0.1, |
| 183 | + 0.2, 0.5, 1.0, 5.0, 30.0)) |
| 184 | + .build(); |
| 185 | + |
| 186 | + entrySizeHistogram = meter |
| 187 | + .histogramBuilder(ENTRY_SIZE_HISTOGRAM) |
| 188 | + .ofLongs() |
| 189 | + .setDescription("Size of entries written to the ledger.") |
| 190 | + .setUnit("By") |
| 191 | + .setExplicitBucketBoundariesAdvice(Arrays.asList(128L, 512L, 1024L, 2048L, 4096L, 16_384L, |
| 192 | + 102_400L, 1_048_576L)) |
| 193 | + .build(); |
127 | 194 | } |
128 | 195 |
|
129 | 196 | @Override |
@@ -151,4 +218,24 @@ private void recordMetrics(ManagedLedger ml) { |
151 | 218 | markDeleteCounter.record(stats.getMarkDeleteTotal(), attributes); |
152 | 219 | readEntryCacheMissCounter.record(stats.getReadEntriesOpsCacheMissesTotal(), attributes); |
153 | 220 | } |
| 221 | + |
| 222 | + void recordAddEntryLatency(long latency, TimeUnit unit, ManagedLedger ml) { |
| 223 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 224 | + this.addEntryLatencyHistogram.record(unit.toMillis(latency) / 1000.0, attributes); |
| 225 | + } |
| 226 | + |
| 227 | + void recordLedgerAddEntryLatency(long latency, TimeUnit unit, ManagedLedger ml) { |
| 228 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 229 | + this.ledgerAddEntryLatencyHistogram.record(unit.toMillis(latency) / 1000.0, attributes); |
| 230 | + } |
| 231 | + |
| 232 | + void recordLedgerSwitchLatency(long latency, TimeUnit unit, ManagedLedger ml) { |
| 233 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 234 | + this.ledgerSwitchLatencyHistogram.record(unit.toMillis(latency) / 1000.0, attributes); |
| 235 | + } |
| 236 | + |
| 237 | + void recordEntrySize(long entrySize, ManagedLedger ml) { |
| 238 | + final var attributes = ml.getManagedLedgerAttributes().getAttributesOnlyNamespace(); |
| 239 | + this.entrySizeHistogram.record(entrySize, attributes); |
| 240 | + } |
154 | 241 | } |
0 commit comments