Различия
Показаны различия между двумя версиями страницы.
| Предыдущая версия справа и слева Предыдущая версия Следующая версия | Предыдущая версия | ||
| software:monitoring [2025/11/15 05:15] – [promtail_config] 192.168.1.159 | software:monitoring [2025/12/07 02:38] (текущий) – [Программные средства] mirocow | ||
|---|---|---|---|
| Строка 1: | Строка 1: | ||
| - | {{tag> | + | {{tag> |
| - | ====== | + | ====== |
| - | ===== Версии: ===== | + | {{:software:67567.jpg?600|}} |
| - | + | ||
| - | * grafana/ | + | |
| - | * grafana/ | + | |
| - | * grafana/ | + | |
| - | ===== Настройки | + | Мониторинг IT-инфраструктуры (ИТ-мониторинг) — это процесс постоянного сбора, обработки и анализа данных о состоянии элементов ИТ-среды: |
| - | ==== loki_config ==== | + | * Минимизация времени простоя — быстрая реакция на проблемы (перезапуск служб, уведомление администраторов, |
| + | * Снижение операционных расходов — автоматизация контроля сети, серверов, | ||
| + | * Улучшение пользовательского опыта — стабильная работа систем влияет на удовлетворённость клиентов и сотрудников, | ||
| + | * Планирование развития инфраструктуры — анализ исторических данных и трендов позволяет прогнозировать будущие потребности в ресурсах и планировать развитие ИТ-инфраструктуры. | ||
| - | <code yaml> | + | ===== Программы ===== |
| - | auth_enabled: | + | |
| - | server: | + | Grafana, Promtail, Loki, Prometheus, Fluent Bit, Fluentd, Kibana, Logstash, Elasticsearch, |
| - | http_listen_port: | + | |
| - | grpc_listen_port: | + | |
| - | log_level: info | + | |
| - | # Таймауты для стабильности | + | |
| - | http_server_read_timeout: | + | |
| - | http_server_write_timeout: | + | |
| - | common: | + | ==== Рекомендации ==== |
| - | path_prefix: | + | |
| - | storage: | + | |
| - | filesystem: | + | |
| - | chunks_directory: | + | |
| - | rules_directory: | + | |
| - | replication_factor: | + | |
| - | ring: | + | |
| - | instance_addr: | + | |
| - | kvstore: | + | |
| - | store: inmemory | + | |
| - | # Критически важные настройки для | + | * Использовать Fluentd |
| - | query_scheduler: | + | |
| - | max_outstanding_requests_per_tenant: | + | |
| - | frontend: | + | ===== Программные средства ===== |
| - | # Параметр max_outstanding_per_tenant удален из этой | + | |
| - | log_queries_longer_than: | + | |
| - | compress_responses: | + | |
| - | query_range: | ||
| - | parallelise_shardable_queries: | ||
| - | results_cache: | ||
| - | cache: | ||
| - | embedded_cache: | ||
| - | enabled: true | ||
| - | max_size_mb: | ||
| - | max_retries: | ||
| - | limits_config: | + | * [[system:universal]] |
| - | | + | |
| - | query_timeout: 5m | + | |
| - | | + | |
| - | ingestion_rate_mb: 1000 | + | |
| - | ingestion_burst_size_mb: | + | |
| - | max_line_size: | + | |
| - | reject_old_samples: | + | |
| - | reject_old_samples_max_age: | + | |
| - | max_entries_limit_per_query: | + | |
| - | retention_period: | + | |
| - | max_query_length: | + | |
| - | max_query_parallelism: | + | |
| - | + | | |
| - | schema_config: | + | |
| - | configs: | + | |
| - | | + | |
| - | store: tsdb | + | * [[system:watch]] |
| - | object_store: | + | |
| - | schema: v13 | + | |
| - | index: | + | |
| - | prefix: index_ | + | |
| - | period: 24h | + | |
| - | + | ||
| - | ingester: | + | |
| - | | + | |
| - | enabled: true | + | |
| - | dir: /loki/wal | + | |
| - | flush_on_shutdown: | + | |
| - | lifecycler: | + | |
| - | ring: | + | |
| - | kvstore: | + | |
| - | store: inmemory | + | |
| - | replication_factor: | + | |
| - | heartbeat_timeout: | + | |
| - | chunk_idle_period: | + | |
| - | max_chunk_age: | + | |
| - | chunk_target_size: | + | |
| - | chunk_retain_period: | + | |
| - | + | ||
| - | storage_config: | + | |
| - | tsdb_shipper: | + | |
| - | active_index_directory: | + | |
| - | cache_location: | + | |
| - | filesystem: | + | |
| - | directory: / | + | |
| - | + | ||
| - | compactor: | + | |
| - | working_directory: | + | |
| - | | + | |
| - | | + | |
| - | | + | |
| - | | + | |
| - | | + | |
| - | + | ||
| - | + | ||
| - | querier: | + | |
| - | | + | |
| - | | + | |
| - | + | ||
| - | analytics: | + | |
| - | | + | |
| - | </ | + | |
| - | + | ||
| - | ==== promtail_config ==== | + | |
| - | + | ||
| - | <code yaml> | + | |
| - | server: | + | |
| - | | + | |
| - | | + | |
| - | + | ||
| - | positions: | + | |
| - | | + | |
| - | | + | |
| - | sync_period: | + | |
| - | + | ||
| - | clients: | + | |
| - | | + | |
| - | backoff_config: | + | |
| - | min_period: 10s | + | |
| - | max_period: 5m | + | |
| - | max_retries: | + | |
| - | batchwait: 30s | + | |
| - | batchsize: 2097152 | + | |
| - | timeout: 60s | + | |
| - | external_labels: | + | |
| - | cluster: docker-swarm | + | |
| - | host: " | + | |
| - | + | ||
| - | scrape_configs: | + | |
| - | + | ||
| - | - job_name: docker_containers | + | |
| - | docker_sd_configs: | + | |
| - | - host: unix:/// | + | |
| - | refresh_interval: | + | |
| - | filters: | + | |
| - | - name: status | + | |
| - | values: [" | + | |
| - | relabel_configs: | + | |
| - | - target_label: | + | |
| - | replacement: | + | |
| - | - source_labels: | + | |
| - | | + | |
| - | target_label: | + | |
| - | action: replace | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | regex: " | + | |
| - | action: keep | + | |
| - | - source_labels: | + | |
| - | target_label: swarm_service_name | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | action: replace | + | |
| - | - source_labels: | + | |
| - | | + | |
| - | action: replace | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | action: replace | + | |
| - | - source_labels: | + | |
| - | target_label: log_stream | + | |
| - | action: replace | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | action: replace | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | action: replace | + | |
| - | # Правило дропа для тестирования | + | |
| - | # - source_labels: | + | |
| - | # | + | |
| - | # | + | |
| - | pipeline_stages: | + | |
| - | - docker: {} | + | |
| - | - timestamp: | + | |
| - | source: current_time | + | |
| - | format: RFC3339 | + | |
| - | + | ||
| - | | + | |
| - | journal: | + | |
| - | max_age: 24h | + | |
| - | path: / | + | |
| - | labels: | + | |
| - | job: systemd_journal | + | |
| - | relabel_configs: | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | - source_labels: | + | |
| - | target_label: unit | + | |
| - | - source_labels: | + | |
| - | target_label: | + | |
| - | pipeline_stages: | + | |
| - | - timestamp: | + | |
| - | source: current_time | + | |
| - | format: RFC3339 | + | |
| - | </ | + | |
| - | + | ||
| - | ===== Docker Compose ===== | + | |
| - | + | ||
| - | + | ||
| - | monitoring | + | |
| - | <code yaml> | + | |
| - | version: " | + | |
| - | + | ||
| - | services: | + | |
| - | + | ||
| - | | + | |
| - | image: grafana/ | + | |
| - | ports: | + | |
| - | - " | + | |
| - | configs: | + | |
| - | - source: loki_config | + | |
| - | target: / | + | |
| - | volumes: | + | |
| - | - loki_data:/ | + | |
| - | - / | + | |
| - | - / | + | |
| - | command: | + | |
| - | - -config.file=/ | + | |
| - | - -config.expand-env=true | + | |
| - | - -target=all | + | |
| - | networks: | + | |
| - | - monitoring | + | |
| - | deploy: | + | |
| - | placement: | + | |
| - | constraints: | + | |
| - | - node.role == manager | + | |
| - | resources: | + | |
| - | limits: | + | |
| - | memory: 2G # Уменьшаем память | + | |
| - | cpus: ' | + | |
| - | reservations: | + | |
| - | memory: 1G | + | |
| - | cpus: ' | + | |
| - | restart_policy: | + | |
| - | condition: on-failure | + | |
| - | delay: 10s | + | |
| - | max_attempts: | + | |
| - | + | ||
| - | | + | |
| - | image: grafana/ | + | |
| - | configs: | + | |
| - | - source: promtail_config | + | |
| - | target: / | + | |
| - | volumes: | + | |
| - | - / | + | |
| - | - / | + | |
| - | - / | + | |
| - | - / | + | |
| - | - / | + | |
| - | - promtail_positions:/ | + | |
| - | - / | + | |
| - | - / | + | |
| - | command: | + | |
| - | - -config.file=/ | + | |
| - | - -client.external-labels=host=${HOSTNAME} | + | |
| - | - -config.expand-env=true | + | |
| - | #- -log.level=info | + | |
| - | environment: | + | |
| - | - HOSTNAME={{.Node.Hostname}} | + | |
| - | networks: | + | |
| - | - monitoring | + | |
| - | deploy: | + | |
| - | mode: global | + | |
| - | resources: | + | |
| - | limits: | + | |
| - | memory: 512M | + | |
| - | cpus: ' | + | |
| - | reservations: | + | |
| - | memory: 256M | + | |
| - | cpus: ' | + | |
| - | restart_policy: | + | |
| - | condition: any | + | |
| - | delay: 30s | + | |
| - | max_attempts: | + | |
| - | + | ||
| - | | + | |
| - | image: grafana/ | + | |
| - | ports: | + | |
| - | - " | + | |
| - | environment: | + | |
| - | - GF_SECURITY_ADMIN_PASSWORD=admin | + | |
| - | - GF_SECURITY_ADMIN_USER=admin | + | |
| - | - GF_USERS_ALLOW_SIGN_UP=false | + | |
| - | volumes: | + | |
| - | - grafana_data:/ | + | |
| - | - / | + | |
| - | - / | + | |
| - | networks: | + | |
| - | - monitoring | + | |
| - | deploy: | + | |
| - | placement: | + | |
| - | constraints: | + | |
| - | | + | |
| - | resources: | + | |
| - | limits: | + | |
| - | memory: 512M | + | |
| - | cpus: ' | + | |
| - | reservations: | + | |
| - | memory: 256M | + | |
| - | cpus: ' | + | |
| - | + | ||
| - | configs: | + | |
| - | | + | |
| - | external: true | + | |
| - | promtail_config: | + | |
| - | external: true | + | |
| - | + | ||
| - | networks: | + | |
| - | monitoring: | + | |
| - | driver: overlay | + | |
| - | attachable: true | + | |
| - | + | ||
| - | + | ||
| - | volumes: | + | |
| - | promtail_positions: | + | |
| - | driver: local | + | |
| - | loki_data: | + | |
| - | driver: local | + | |
| - | grafana_data: | + | |
| - | driver: local | + | |
| - | </ | + | |