Skip to content
Snippets Groups Projects
Commit 3e564120 authored by Jan David Mol
Browse files

more reasonable buckets for transfer durations

parent e0cd9829
No related branches found
No related tags found
1 merge request: !1458 Add custom monitoring points to LTA ingest, TMSS backend, and scheduling service
......@@ -7,7 +7,7 @@ import random
import socket
import re
import getpass
from prometheus_client import Gauge, Counter
from prometheus_client import Gauge, Counter, Histogram, INF
from lofar.lta.ingest.common.job import *
from lofar.lta.ingest.server.sip import validateSIPAgainstSchema, addIngestInfoToSIP
......@@ -29,7 +29,8 @@ logger = logging.getLogger(__name__)
#---------------------- Prometheus Metrics ----------------------------------------
metric_nr_transfers_in_progress = Gauge("ingest_transfers_in_progress", "Count how many transfers are currently in progress", labelnames=["site"])
metric_transfer_durations = Histogram("ingest_transfer_durations", "How long transfers are taking", labelnames=["site"])
metric_transfer_durations = Histogram("ingest_transfer_durations", "How long transfers are taking", labelnames=["site"],
buckets=(1.0, 10.0, 60.0, 5 * 60.0, 10 * 60.0, 30 * 60.0, 3600.0, 2 * 3600.0, 4 * 3600.0, 8 * 3600.0, 12 * 3600.0, 24 * 3600.0, INF))
metric_nr_transfer_exceptions = Counter("ingest_transfer_exceptions", "Number of exceptions raised during transfer", labelnames=["site", "reason"])
metric_nr_bytes_transferred = Counter("ingest_bytes_ingested", "Number of payload bytes ingested into the LTA (sum of ingested file sizes)", labelnames=["site"])
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment