enabled telegraf again and set failsafe configuration
This commit is contained in:
20
roles/server/files/telegraf.d/agent.conf
Normal file
20
roles/server/files/telegraf.d/agent.conf
Normal file
@@ -0,0 +1,20 @@
|
||||
# Global Telegraf agent settings, tuned so that memory use stays bounded
# while an output is unreachable.
[agent]
# Collection: gather every 10s, aligned to multiples of the interval
# (round_interval), with up to 1s of random delay per input so that
# inputs do not all fire at the same instant.
interval = "10s"
round_interval = true
collection_jitter = "1s"

# Flushing: write to outputs every 10s, with up to 2s of random jitter.
flush_interval = "10s"
flush_jitter = "2s"

# Keep batches small: less RAM is needed per write.
metric_batch_size = 500
# At most 10,000 metrics are held in RAM. Once the buffer is full, the
# oldest metrics are dropped, which prevents a memory blow-up.
metric_buffer_limit = 10000
|
||||
11
roles/server/files/telegraf.d/output_file.conf
Normal file
11
roles/server/files/telegraf.d/output_file.conf
Normal file
@@ -0,0 +1,11 @@
|
||||
# Fallback output (optional, but very helpful): write every metric to a local
# file so that data is still available when InfluxDB is offline for longer
# than the in-memory buffer can cover.
#
# Local file writes do not depend on the network, so this output keeps
# draining while InfluxDB is down.
[[outputs.file]]
# Only the backup file is listed. Adding "stdout" here would also copy every
# metric into the service's standard output and therefore into its log.
files = ["/var/log/telegraf/metrics_backup.out"]
# Rotate once a day, or earlier when the file reaches 100MB, and keep five
# archives. This covers up to about five days of outage while disk usage
# stays bounded at roughly 600MB (the active file plus five archives).
rotation_interval = "24h"
rotation_max_size = "100MB"
rotation_max_archives = 5
|
||||
@@ -1,4 +1,17 @@
|
||||
# Primary output: InfluxDB over HTTP.
[[outputs.influxdb]]
urls = ["http://grafana.universe.local:8086"]
database = "linux"
# Explicitly left at false, i.e. database creation is not skipped.
skip_database_creation = false

# NOTE(review): these credentials are stored in plain text in the repository.
# Consider supplying them from a vault or an environment variable instead.
username = "telegraf"
password = "secret"

# Bound every HTTP write so that an unreachable database fails fast instead
# of blocking the flush. `timeout` is the option this plugin provides for
# that; there is no separate `write_timeout` setting, and Telegraf refuses to
# load a config that contains fields a plugin does not define.
timeout = "3s"

# Ask for the connection to be closed after each request.
# NOTE(review): the original comment calls this useful from Telegraf 1.20 on;
# confirm against the deployed version.
http_headers = { "Connection" = "close" }
|
||||
@@ -8,7 +8,7 @@
|
||||
|
||||
- block:
|
||||
- include_tasks: utilities/mail_transfer_agent.yml
|
||||
# - include_tasks: utilities/telegraf.yml
|
||||
- include_tasks: utilities/telegraf.yml
|
||||
when: ansible_distribution in ["Debian", "Ubuntu", "Linux Mint"]
|
||||
- include_tasks: utilities/netdata.yml
|
||||
when: netdata is defined and netdata == true
|
||||
|
||||
@@ -27,11 +27,10 @@
|
||||
|
||||
- name: server | telegraf | copy basic config
|
||||
copy:
|
||||
dest: "/etc/telegraf/{{ item }}"
|
||||
dest: "/etc/telegraf/telegraf.d/{{ item | basename }}"
|
||||
src: "{{ item }}"
|
||||
loop:
|
||||
- telegraf.d/input_basics.conf
|
||||
- telegraf.d/output_influx.conf
|
||||
with_fileglob:
|
||||
- "telegraf.d/*.conf"
|
||||
notify: restart_telegraf
|
||||
|
||||
|
||||
Reference in New Issue
Block a user