blob: a73ce541a3ece15d9497a4b89a0b43ce20e960cd [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.dolphinscheduler.server.worker.metrics;
import java.util.concurrent.TimeUnit;
import java.util.function.Supplier;
import lombok.experimental.UtilityClass;
import io.micrometer.core.instrument.Counter;
import io.micrometer.core.instrument.DistributionSummary;
import io.micrometer.core.instrument.Gauge;
import io.micrometer.core.instrument.Metrics;
import io.micrometer.core.instrument.Timer;
@UtilityClass
public class WorkerServerMetrics {
private final Counter workerOverloadCounter =
Counter.builder("ds.worker.overload.count")
.description("overloaded workers count")
.register(Metrics.globalRegistry);
private final Counter workerFullSubmitQueueCounter =
Counter.builder("ds.worker.full.submit.queue.count")
.description("full worker submit queues count")
.register(Metrics.globalRegistry);
private final Counter workerResourceDownloadSuccessCounter =
Counter.builder("ds.worker.resource.download.count")
.tag("status", "success")
.description("worker resource download success count")
.register(Metrics.globalRegistry);
private final Counter workerResourceDownloadFailCounter =
Counter.builder("ds.worker.resource.download.count")
.tag("status", "fail")
.description("worker resource download failure count")
.register(Metrics.globalRegistry);
private final Timer workerResourceDownloadDurationTimer =
Timer.builder("ds.worker.resource.download.duration")
.publishPercentiles(0.5, 0.75, 0.95, 0.99)
.publishPercentileHistogram()
.description("time cost of resource download on workers")
.register(Metrics.globalRegistry);
private final DistributionSummary workerResourceDownloadSizeDistribution =
DistributionSummary.builder("ds.worker.resource.download.size")
.baseUnit("bytes")
.publishPercentiles(0.5, 0.75, 0.95, 0.99)
.publishPercentileHistogram()
.description("size of downloaded resource files on worker")
.register(Metrics.globalRegistry);
public void incWorkerOverloadCount() {
workerOverloadCounter.increment();
}
public void incWorkerSubmitQueueIsFullCount() {
workerFullSubmitQueueCounter.increment();
}
public void incWorkerResourceDownloadSuccessCount() {
workerResourceDownloadSuccessCounter.increment();
}
public void incWorkerResourceDownloadFailureCount() {
workerResourceDownloadFailCounter.increment();
}
public void recordWorkerResourceDownloadTime(final long milliseconds) {
workerResourceDownloadDurationTimer.record(milliseconds, TimeUnit.MILLISECONDS);
}
public void recordWorkerResourceDownloadSize(final long size) {
workerResourceDownloadSizeDistribution.record(size);
}
public void registerWorkerTaskTotalGauge(final Supplier<Number> supplier) {
Gauge.builder("ds.worker.task", supplier)
.description("total number of tasks on worker")
.register(Metrics.globalRegistry);
}
public void registerWorkerExecuteQueueSizeGauge(Supplier<Number> supplier) {
Gauge.builder("ds.worker.execute.queue.size", supplier)
.description("worker execute queue size")
.register(Metrics.globalRegistry);
}
public void registerWorkerActiveExecuteThreadGauge(Supplier<Number> supplier) {
Gauge.builder("ds.worker.active.execute.thread", supplier)
.description("number of active task execute threads on worker")
.register(Metrics.globalRegistry);
}
public void registerWorkerMemoryAvailableGauge(Supplier<Number> supplier) {
Gauge.builder("ds.worker.memory.available", supplier)
.description("worker memory available")
.register(Metrics.globalRegistry);
}
public void registerWorkerCpuUsageGauge(Supplier<Number> supplier) {
Gauge.builder("ds.worker.cpu.usage", supplier)
.description("worker cpu usage")
.register(Metrics.globalRegistry);
}
public void registerWorkerMemoryUsageGauge(Supplier<Number> supplier) {
Gauge.builder("ds.worker.memory.usage", supplier)
.description("worker memory usage")
.register(Metrics.globalRegistry);
}
}