362 lines
12 KiB
JSON
362 lines
12 KiB
JSON
[
|
|
{
|
|
"Name":"TSG-X_firewall_container_status",
|
|
"Type":"1",
|
|
"Evaluation interval ":"0",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"firewall\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Container firewall status is not running.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_proxy_container_status",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"proxy\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Container proxy status is not running.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_certstore_container_status",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"certstore\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Container certstore process != 1.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_cert_redis_container_status",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"cert-redis\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Container cert-redis status is not running.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_telegraf_container_status",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_pod_container_status_running{project=\"TSG-X\",container=\"telegraf\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"!=\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Container telegraf status is not running.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_traffic_steering_too_high",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"irate(phy_rx_bits_total{project=\"TSG-X\",dev!~\"virtio_dign_(.*)\"}[1m])\n",
|
|
"Condition":"[{\"id\":2,\"weight\":1,\"operator\":\">=\",\"value\":\"160000000000\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"bits/sec",
|
|
"Duration (s)":"60",
|
|
"Summary":"Physical trafific steering to high.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_packet_io_rx_missed",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"irate(phy_rx_missed_total{project=\"TSG-X\",dev!~\"virtio_dign_(.*)\"}[1m])",
|
|
"Condition":"[{\"id\":2,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"packets/sec",
|
|
"Duration (s)":"60",
|
|
"Summary":"Packet drops by NIC cards.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_packet_io_rx_error",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"irate(phy_rx_error_total{project=\"TSG-X\",dev!~\"virtio_dign_(.*)\"}[1m])",
|
|
"Condition":"[{\"id\":2,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"packets/sec",
|
|
"Duration (s)":"60",
|
|
"Summary":"Packet drops by CRC errors.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_physical_component_too_hot",
|
|
"Type":"1",
|
|
"Evaluation interval ":"0",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"node_hwmon_temp_celsius{project=\"TSG-X\"}",
|
|
"Condition":"[{\"id\":3,\"weight\":1,\"operator\":\">\",\"value\":\"75.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Host physical component too hot (instance {{ $labels.instance }})",
|
|
"Description":"Physical hardware component too hot\nVALUE = {{ $value }}\nLABELS: {{ $labels }}",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_node_memory_pressure",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_node_status_condition{condition=\"MemoryPressure\",status=\"true\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"==\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Node memory pressure (instance {{ $labels.instance }})",
|
|
"Description":"{{ $labels.node }} has MemoryPressure condition\\n VALUE = {{ $value }}\\n LABELS = {{ $labels }}",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_node_disk_pressure",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"kube_node_status_condition{condition=\"DiskPressure\",status=\"true\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\"==\",\"value\":\"1.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Node disk pressure (instance {{ $labels.instance }})",
|
|
"Description":"{{ $labels.node }} has DiskPressure condition\\n VALUE = {{ $value }}\\n LABELS = {{ $labels }}",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_host_high_cpu_load",
|
|
"Type":"1",
|
|
"Evaluation interval ":"0",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"100 - (avg by(instance) (rate(node_cpu_seconds_total{mode=\"idle\"}[2m])) * 100) > 80",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"80.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"percent(0-100)",
|
|
"Duration (s)":"60",
|
|
"Summary":"Host high CPU load (instance {{ $labels.instance }})",
|
|
"Description":"CPU load is > 80%\\n VALUE = {{ $value }}\\n LABELS = {{ $labels }}",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_packet_io_rxdrop",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"irate(rx_drops_total{project=\"TSG-X\"}[1m])",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"packets/sec",
|
|
"Duration (s)":"60",
|
|
"Summary":"Packet drops by application for the poor performance.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_packet_tx_missed",
|
|
"Type":"1",
|
|
"Evaluation interval ":"60",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"phy_tx_error_total{project=\"TSG-X\"}",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"packets/sec",
|
|
"Duration (s)":"60",
|
|
"Summary":"Packet I/O TX missed.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
},
|
|
{
|
|
"Name":"TSG-X_packet_io_tx_drops",
|
|
"Type":"1",
|
|
"Evaluation interval ":"0",
|
|
"Timeout(s)":"300",
|
|
"Expression/OID":"irate(tx_drops_total{project=\"TSG-X\"}[1m]) + irate(ftx_missed_total{project=\"TSG-X\"}[1m])",
|
|
"Condition":"[{\"id\":1,\"weight\":1,\"operator\":\">\",\"value\":\"0.0\"}]",
|
|
"Extension Label":"",
|
|
"Unit":"short",
|
|
"Duration (s)":"60",
|
|
"Summary":"Packet TX Drops by applicaton poor performance.",
|
|
"Description":"",
|
|
"Receiver":"",
|
|
"Notices":"",
|
|
"State":"1",
|
|
"Automatic expired":"1",
|
|
"Schedule":"0",
|
|
"Effective times":"",
|
|
"Start time":"00:00",
|
|
"End time":"23:59",
|
|
"Active notification":"0",
|
|
"Expired notification":"0",
|
|
"Trouble shooting":"<div class=\"editor-core ql-container ql-snow\"><div class=\"ql-editor\"><p><br></p></div></div>"
|
|
}
|
|
] |