Enabled Telegraf again and set a failsafe configuration
This commit is contained in:
20
roles/server/files/telegraf.d/agent.conf
Normal file
20
roles/server/files/telegraf.d/agent.conf
Normal file
@@ -0,0 +1,20 @@
|
|||||||
|
###############################################################################
|
||||||
|
# GLOBAL AGENT CONFIG
|
||||||
|
###############################################################################
|
||||||
|
[agent]
|
||||||
|
## Collection interval: how often the input plugins gather metrics
|
||||||
|
interval = "10s"
|
||||||
|
|
||||||
|
## Keep batches small → less RAM per batch sent to an output
|
||||||
|
metric_batch_size = 500
|
||||||
|
metric_buffer_limit = 10000 # at most 10,000 unwritten metrics are held in RAM (Telegraf applies this limit per output)
|
||||||
|
|
||||||
|
## Once metric_buffer_limit (above) is reached, the oldest metrics are dropped
|
||||||
|
## → caps memory use. The jitter values below spread collection and flush times.
|
||||||
|
collection_jitter = "1s"
|
||||||
|
flush_interval = "10s"
|
||||||
|
flush_jitter = "2s"
|
||||||
|
|
||||||
|
## NOTE(review): round_interval only aligns collection to multiples of "interval"
|
||||||
|
## (:00, :10, ...); it does not limit write retries or discard batches — confirm intent.
|
||||||
|
round_interval = true
|
||||||
11
roles/server/files/telegraf.d/output_file.conf
Normal file
11
roles/server/files/telegraf.d/output_file.conf
Normal file
@@ -0,0 +1,11 @@
|
|||||||
|
# --- FALLBACK: also write metrics to a local file (optional, but VERY helpful) ---
|
||||||
|
# Keeps a local copy of recent metrics while InfluxDB is unreachable. Rotation
|
||||||
|
# (hourly or at 100MB, 5 archives kept) limits this to roughly the last 5-6 hours;
|
||||||
|
# raise rotation_interval / rotation_max_archives if longer outages must be covered.
|
||||||
|
# "stdout" is deliberately not a target: it would duplicate every metric on Telegraf's standard output.
|
||||||
|
|
||||||
|
[[outputs.file]]
|
||||||
|
files = ["/var/log/telegraf/metrics_backup.out"]
|
||||||
|
rotation_interval = "1h"
|
||||||
|
rotation_max_size = "100MB"
|
||||||
|
rotation_max_archives = 5
|
||||||
@@ -1,4 +1,17 @@
|
|||||||
[[outputs.influxdb]]
|
[[outputs.influxdb]]
|
||||||
urls = ["http://grafana.universe.local:8086"]
|
urls = ["http://grafana.universe.local:8086"]
|
||||||
database = "linux"
|
database = "linux"
|
||||||
|
|
||||||
|
## Keep the HTTP timeout short so writes to an unreachable InfluxDB fail fast
|
||||||
|
timeout = "3s"
|
||||||
|
username = "telegraf"
|
||||||
|
password = "secret" # NOTE(review): plain-text credential in the repository; consider Ansible Vault or a template
|
||||||
|
|
||||||
|
## If the database is unreachable, do not block for long: "timeout" above already
|
||||||
|
## bounds every write attempt, and unsent metrics stay buffered for the next flush.
|
||||||
|
## Do not add write_timeout here: outputs.influxdb has no such option and Telegraf rejects unknown keys.
|
||||||
|
## Send "Connection: close" with each request. NOTE(review): the original "Telegraf 1.20+" claim is unverified.
|
||||||
|
http_headers = { "Connection" = "close" }
|
||||||
|
|
||||||
|
## false: Telegraf still sends CREATE DATABASE when it connects (value unchanged by this commit)
|
||||||
skip_database_creation = false
|
skip_database_creation = false
|
||||||
@@ -8,7 +8,7 @@
|
|||||||
|
|
||||||
- block:
|
- block:
|
||||||
- include_tasks: utilities/mail_transfer_agent.yml
|
- include_tasks: utilities/mail_transfer_agent.yml
|
||||||
# - include_tasks: utilities/telegraf.yml
|
- include_tasks: utilities/telegraf.yml # NOTE(review): re-enabled; the `when:` below presumably guards this include now rather than the mail_transfer_agent one — confirm indentation
|
||||||
when: ansible_distribution in ["Debian", "Ubuntu", "Linux Mint"]
|
when: ansible_distribution in ["Debian", "Ubuntu", "Linux Mint"]
|
||||||
- include_tasks: utilities/netdata.yml
|
- include_tasks: utilities/netdata.yml
|
||||||
when: netdata is defined and netdata == true
|
when: netdata is defined and netdata == true
|
||||||
|
|||||||
@@ -27,11 +27,10 @@
|
|||||||
|
|
||||||
- name: server | telegraf | copy basic config
|
- name: server | telegraf | copy basic config
|
||||||
copy:
|
copy:
|
||||||
dest: "/etc/telegraf/{{ item }}"
|
dest: "/etc/telegraf/telegraf.d/{{ item | basename }}" # basename keeps only the file name, so each file lands directly in telegraf.d/
|
||||||
src: "{{ item }}"
|
src: "{{ item }}"
|
||||||
loop:
|
with_fileglob: # iterates over every file matching the glob below instead of a fixed list
|
||||||
- telegraf.d/input_basics.conf
|
- "telegraf.d/*.conf"
|
||||||
- telegraf.d/output_influx.conf
|
|
||||||
notify: restart_telegraf
|
notify: restart_telegraf
|
||||||
|
|
||||||
|
|
||||||
Reference in New Issue
Block a user