This repository has been archived on 2025-09-14. You can view files and clone it, but cannot push or open issues or pull requests.
Files
tango-tsgx-hardware/NEZHA/deprecated/alert-rule.json

362 lines
12 KiB
JSON

[
{
"Name":"TSG-X_firewall_container_status",
"Type":"1",
"Evaluation interval ":"0",
"Timeout(s)":"300",
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"firewall\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Container firewall status is not running.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_proxy_container_status",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"proxy\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Container proxy status is not running.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_certstore_container_status",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"certstore\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Container certstore process != 1.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_cert_redis_container_status",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"cert-redis\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Container cert-redis status is not running.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_telegraf_container_status",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"telegraf\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Container telegraf status is not running.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_traffic_steering_too_high",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"irate(phy_rx_bits_total{project=\"TSG-X\",dev!~\"virtio_dign_(.*)\"}[1m])\n",
"Condition":"[{\"id\":2,\"weight\":1,\"operator\":\">=\",\"value\":\"160000000000\"}]",
"Extension Label":"",
"Unit":"bits/sec",
"Duration (s)":"60",
"Summary":"Physical trafific steering to high.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_packet_io_rx_missed",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"irate(phy_rx_missed_total{project=\"TSG-X\",dev!~\"virtio_dign_(.*)\"}[1m])",
"Condition":"[{\"id\":2,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
"Extension Label":"",
"Unit":"packets/sec",
"Duration (s)":"60",
"Summary":"Packet drops by NIC cards.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_packet_io_rx_error",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"irate(phy_rx_error_total{project=\"TSG-X\",dev!~\"virtio_dign_(.*)\"}[1m])",
"Condition":"[{\"id\":2,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
"Extension Label":"",
"Unit":"packets/sec",
"Duration (s)":"60",
"Summary":"Packet drops by CRC errors.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_physical_component_too_hot",
"Type":"1",
"Evaluation interval ":"0",
"Timeout(s)":"300",
"Expression/OID":"node_hwmon_temp_celsius{project=\"TSG-X\"}",
"Condition":"[{\"id\":3,\"weight\":1,\"operator\":\">\",\"value\":\"75.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Host physical component too hot (instance {{ $labels.instance }})",
"Description":"Physical hardware component too hot\nVALUE = {{ $value }}\nLABELS: {{ $labels }}",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_node_memory_pressure",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"kube_node_status_condition{condition=\"MemoryPressure\",status=\"true\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"==\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Node memory pressure (instance {{ $labels.instance }})",
"Description":"{{ $labels.node }} has MemoryPressure condition\\n VALUE = {{ $value }}\\n LABELS = {{ $labels }}",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_node_disk_pressure",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"kube_node_status_condition{condition=\"DiskPressure\",status=\"true\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"==\",\"value\":\"1.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Node disk pressure (instance {{ $labels.instance }})",
"Description":"{{ $labels.node }} has DiskPressure condition\\n VALUE = {{ $value }}\\n LABELS = {{ $labels }}",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_host_high_cpu_load",
"Type":"1",
"Evaluation interval ":"0",
"Timeout(s)":"300",
"Expression/OID":"100 - (avg by(instance) (rate(node_cpu_seconds_total{mode=\"idle\"}[2m])) * 100) > 80",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"80.0\"}]",
"Extension Label":"",
"Unit":"percent(0-100)",
"Duration (s)":"60",
"Summary":"Host high CPU load (instance {{ $labels.instance }})",
"Description":"CPU load is > 80%\\n VALUE = {{ $value }}\\n LABELS = {{ $labels }}",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_packet_io_rxdrop",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"irate(rx_drops_total{project=\"TSG-X\"}[1m])",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
"Extension Label":"",
"Unit":"packets/sec",
"Duration (s)":"60",
"Summary":"Packet drops by application for the poor performance.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_packet_tx_missed",
"Type":"1",
"Evaluation interval ":"60",
"Timeout(s)":"300",
"Expression/OID":"phy_tx_error_total{project=\"TSG-X\"}",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
"Extension Label":"",
"Unit":"packets/sec",
"Duration (s)":"60",
"Summary":"Packet I/O TX missed.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
},
{
"Name":"TSG-X_packet_io_tx_drops",
"Type":"1",
"Evaluation interval ":"0",
"Timeout(s)":"300",
"Expression/OID":"irate(tx_drops_total{project=\"TSG-X\"}[1m]) + irate(ftx_missed_total{project=\"TSG-X\"}[1m])",
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
"Extension Label":"",
"Unit":"short",
"Duration (s)":"60",
"Summary":"Packet TX Drops by applicaton poor performance.",
"Description":"",
"Receiver":"",
"Notices":"",
"State":"1",
"Automatic expired":"1",
"Schedule":"0",
"Effective times":"",
"Start time":"00:00",
"End time":"23:59",
"Active notification":"0",
"Expired notification":"0",
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
}
]