Hyunsun Moon | f32ae9a | 2020-05-28 13:17:45 -0700 | [diff] [blame] | 1 | #!/usr/bin/env python |
| 2 | |
| 3 | # Copyright 2020-present Open Networking Foundation |
| 4 | # |
Hyunsun Moon | 200eba5 | 2021-04-05 21:31:54 -0700 | [diff] [blame] | 5 | # SPDX-License-Identifier: LicenseRef-ONF-Member-Only-1.0 |
Hyunsun Moon | f32ae9a | 2020-05-28 13:17:45 -0700 | [diff] [blame] | 6 | |
Andy Bavier | 614af14 | 2020-08-07 14:49:56 -0700 | [diff] [blame] | 7 | import os |
Hyunsun Moon | f32ae9a | 2020-05-28 13:17:45 -0700 | [diff] [blame] | 8 | import time |
Andy Bavier | 614af14 | 2020-08-07 14:49:56 -0700 | [diff] [blame] | 9 | import datetime |
| 10 | import pytz |
| 11 | import threading |
| 12 | from icalevents.icalevents import events |
Andy Bavier | 4021a2f | 2020-07-29 12:39:47 -0700 | [diff] [blame] | 13 | from flask import Flask, jsonify, abort, request, Response |
| 14 | import prometheus_client as prom |
Andy Bavier | 2d60fc5 | 2021-05-04 16:13:39 -0700 | [diff] [blame] | 15 | import jsonschema |
Andy Bavier | 55dc587 | 2021-05-05 11:31:42 -0700 | [diff] [blame] | 16 | from logging.config import dictConfig |
Andy Bavier | 4021a2f | 2020-07-29 12:39:47 -0700 | [diff] [blame] | 17 | |
# Maintenance calendar (iCal) URL; None when the variable is not set
SECRET_ICAL_URL = os.getenv("SECRET_ICAL_URL")

# Name of the Aether environment this server is monitoring (e.g., "production").
# Downtime is scheduled by appending the environment to the cluster name,
# as in "ace-tucson-production".
AETHER_ENV = os.getenv("AETHER_ENV", "production")

# Seconds without an agent report before an edge moves to "no result" status
NO_RESULT_THRESHOLD = 360
Hyunsun Moon | f32ae9a | 2020-05-28 13:17:45 -0700 | [diff] [blame] | 27 | |
# Logging setup: a single stream handler writing "<LEVEL> <message>" lines to
# Flask's WSGI error stream, attached to the root logger at INFO level.
_LOGGING_SETTINGS = dict(
    version=1,
    formatters={
        'default': {'format': '%(levelname)s %(message)s'},
    },
    handlers={
        'wsgi': {
            'class': 'logging.StreamHandler',
            'stream': 'ext://flask.logging.wsgi_errors_stream',
            'formatter': 'default',
        },
    },
    root={
        'level': 'INFO',
        'handlers': ['wsgi'],
    },
)
dictConfig(_LOGGING_SETTINGS)

# The Flask application object that the route decorators below attach to
app = Flask(__name__)
Andy Bavier | 2d60fc5 | 2021-05-04 16:13:39 -0700 | [diff] [blame] | 45 | |
def _schema_object(properties, required=None):
    """Return a JSON-schema "object" node; "required" is added only if given."""
    node = {"type": "object", "properties": properties}
    if required is not None:
        node["required"] = list(required)
    return node


def _all_of_type(json_type, names):
    """Map each name in *names* to its own {"type": json_type} node."""
    return {name: {"type": json_type} for name in names}


def _ping_target_schema():
    """Schema for the ping statistics reported for one ping target."""
    return _schema_object(
        _all_of_type("number", ("transmitted", "received", "median",
                                "min", "avg", "max", "stddev")),
        required=("min", "avg", "max", "stddev"),
    )


def _dongle_stats_schema():
    """Schema for the dongle statistics: one boolean flag plus string fields."""
    properties = {"SuccessfulFetch": {"type": "boolean"}}
    properties.update(_all_of_type("string", (
        "MAC", "PLMNStatus", "UICCStatus", "IMEI", "IMSI", "PLMNSelected",
        "MCC", "MNC", "PhyCellID", "CellGlobalID", "Band", "EARFCN",
        "BandWidth", "ServCellState", "Connection", "IPv4Addr",
    )))
    return _schema_object(properties)


# JSON schema describing an edge record; only "name" and "status" are
# mandatory, every other section is optional.
edgeSchema = _schema_object(
    {
        "name": {"type": "string"},
        "status": _schema_object(
            _all_of_type("string", ("control_plane", "user_plane")),
            required=("control_plane", "user_plane"),
        ),
        "dongle_stats": _dongle_stats_schema(),
        "speedtest": _schema_object({
            "ping": _schema_object({
                "dry_run": _ping_target_schema(),
                "dns": _ping_target_schema(),
                "iperf_server": _ping_target_schema(),
                "management_server": _ping_target_schema(),
            }),
            "iperf": _schema_object({
                "cluster": _schema_object(
                    _all_of_type("number", ("downlink", "uplink")),
                    required=("downlink", "uplink"),
                ),
            }),
        }),
        "signal_quality": _schema_object(
            _all_of_type("number", ("rsrq", "rsrp")),
            required=("rsrq", "rsrp"),
        ),
        "counters": _schema_object(_all_of_type("number", (
            'dongle_read_error',
            'dongle_connect_error',
            'dongle_rsrp_rsrq_error',
            'modem_cfun0_error',
            'modem_cfun1_error',
            'modem_cgatt_error',
            'modem_cesq_error',
            'dry_run_ping_error',
            'ping_error',
            'iperf_error',
            'report_send_error',
        ))),
    },
    required=("name", "status"),
)
| 182 | |
def _blank_ping_stats():
    """Return a new all-zero ping statistics record."""
    return {
        'transmitted': 0,
        'received': 0,
        'median': 0.0,
        'min': 0.0,
        'avg': 0.0,
        'max': 0.0,
        'stddev': 0.0,
    }


# Names of the error counters carried in an edge record
_EDGE_COUNTER_NAMES = (
    'dongle_read_error',
    'dongle_connect_error',
    'dongle_rsrp_rsrq_error',
    'modem_cfun0_error',
    'modem_cfun1_error',
    'modem_cgatt_error',
    'modem_cesq_error',
    'dry_run_ping_error',
    'ping_error',
    'iperf_error',
    'report_send_error',
)

# Known edges, seeded with a single placeholder record named "ace-example"
edges = [
    {
        'name': 'ace-example',
        'status': {
            'control_plane': 'connected',
            'user_plane': 'connected',
        },
        'dongle_stats': {
            'SuccessfulFetch': False,
        },
        'speedtest': {
            'ping': {
                target: _blank_ping_stats()
                for target in ('dry_run', 'dns', 'iperf_server', 'management_server')
            },
            'iperf': {
                'cluster': {
                    'downlink': 0.0,
                    'uplink': 0.0,
                },
            },
        },
        'signal_quality': {
            'rsrq': 0,
            'rsrp': 0,
        },
        'counters': dict.fromkeys(_EDGE_COUNTER_NAMES, 0),
        'last_update': time.time(),
    },
]
| 259 | |
# Numeric code for each reported status string, counting up from -2
status_codes = {
    label: code
    for code, label in enumerate(
        ("no result", "error", "disconnected", "connecting", "connected"),
        start=-2,
    )
}

# Calendar text that also identifies an edge, keyed by environment-qualified
# edge name
room_mapping = dict([
    ("ace-menlo-rasp-pi-production", "(Compute)-MP-1-Aether Production"),
    ("ace-menlo-staging", "(Compute)-MP-1-Aether Staging"),
])

# Numeric code for each dongle PLMNStatus string, counting up from 1
plmnstatus_mapping = {
    label: code
    for code, label in enumerate(("Not Searching", "Searching", "Success"), start=1)
}
| 278 | |
def _edge_gauge(metric, description):
    """Create a Prometheus gauge whose only label is the edge "name"."""
    return prom.Gauge(metric, description, ["name"])


# Legacy test status metrics, reporting a status code between -2 and 2
cp_status = _edge_gauge("aetheredge_status_control_plane", "Control plane status code")
up_status = _edge_gauge("aetheredge_status_user_plane", "User plane status code")

# Simplified binary test result metrics
e2e_tests_ok = _edge_gauge("aetheredge_e2e_tests_ok", "Last connect and ping test both passed")
connect_test_ok = _edge_gauge("aetheredge_connect_test_ok", "Last connect test passed")
ping_test_ok = _edge_gauge("aetheredge_ping_test_ok", "Last ping test passed")
e2e_tests_down = _edge_gauge("aetheredge_e2e_tests_down", "E2E tests not reporting")

# Dongle stats (gauges hold numbers only, so string values must be converted
# before they are stored)
dongle_stats_imsi = _edge_gauge("aetheredge_dongle_stats_imsi", "IMSI of the UE")
dongle_stats_cellglobalid = _edge_gauge("aetheredge_dongle_stats_cellglobalid", "CellGlobalID of the UE")
dongle_stats_plmnstatus = _edge_gauge("aetheredge_dongle_stats_plmnstatus", "PLMNStatus of the UE")
dongle_stats_phycellid = _edge_gauge("aetheredge_dongle_stats_phycellid", "PhyCellID of the UE")

# Ping dry_run metrics
ping_dry_run_transmitted = _edge_gauge("aetheredge_ping_dry_run_test_transmitted", "Last ping test to dry_run number of transmitted packets")
ping_dry_run_received = _edge_gauge("aetheredge_ping_dry_run_test_received", "Last ping test to dry_run number of received packets")
ping_dry_run_median = _edge_gauge("aetheredge_ping_dry_run_test_median", "Last ping test to dry_run median value")
ping_dry_run_min = _edge_gauge("aetheredge_ping_dry_run_test_min", "Last ping test to dry_run minimum value")
ping_dry_run_avg = _edge_gauge("aetheredge_ping_dry_run_test_avg", "Last ping test to dry_run average")
ping_dry_run_max = _edge_gauge("aetheredge_ping_dry_run_test_max", "Last ping test to dry_run maximum value")
ping_dry_run_stddev = _edge_gauge("aetheredge_ping_dry_run_test_stddev", "Last ping test to dry_run standard deviation")

# Ping dns metrics
ping_dns_transmitted = _edge_gauge("aetheredge_ping_dns_test_transmitted", "Last ping test to dns number of transmitted packets")
ping_dns_received = _edge_gauge("aetheredge_ping_dns_test_received", "Last ping test to dns number of received packets")
ping_dns_median = _edge_gauge("aetheredge_ping_dns_test_median", "Last ping test to dns median value")
ping_dns_min = _edge_gauge("aetheredge_ping_dns_test_min", "Last ping test to dns minimum value")
ping_dns_avg = _edge_gauge("aetheredge_ping_dns_test_avg", "Last ping test to dns average")
ping_dns_max = _edge_gauge("aetheredge_ping_dns_test_max", "Last ping test to dns maximum value")
ping_dns_stddev = _edge_gauge("aetheredge_ping_dns_test_stddev", "Last ping test to dns standard deviation")

# Ping iperf server metrics
ping_iperf_server_transmitted = _edge_gauge("aetheredge_ping_iperf_server_test_transmitted", "Last ping test to iperf_server number of transmitted packets")
ping_iperf_server_received = _edge_gauge("aetheredge_ping_iperf_server_test_received", "Last ping test to iperf_server number of received packets")
ping_iperf_server_median = _edge_gauge("aetheredge_ping_iperf_server_test_median", "Last ping test to iperf_server median value")
ping_iperf_server_min = _edge_gauge("aetheredge_ping_iperf_server_test_min", "Last ping test to iperf_server minimum value")
ping_iperf_server_avg = _edge_gauge("aetheredge_ping_iperf_server_test_avg", "Last ping test to iperf_server average")
ping_iperf_server_max = _edge_gauge("aetheredge_ping_iperf_server_test_max", "Last ping test to iperf_server maximum value")
ping_iperf_server_stddev = _edge_gauge("aetheredge_ping_iperf_server_test_stddev", "Last ping test to iperf_server standard deviation")

# Ping management_server metrics
ping_management_server_transmitted = _edge_gauge("aetheredge_ping_management_server_test_transmitted", "Last ping test to management_server number of transmitted packets")
ping_management_server_received = _edge_gauge("aetheredge_ping_management_server_test_received", "Last ping test to management_server number of received packets")
ping_management_server_median = _edge_gauge("aetheredge_ping_management_server_test_median", "Last ping test to management_server median value")
ping_management_server_min = _edge_gauge("aetheredge_ping_management_server_test_min", "Last ping test to management_server minimum value")
ping_management_server_avg = _edge_gauge("aetheredge_ping_management_server_test_avg", "Last ping test to management_server average")
ping_management_server_max = _edge_gauge("aetheredge_ping_management_server_test_max", "Last ping test to management_server maximum value")
ping_management_server_stddev = _edge_gauge("aetheredge_ping_management_server_test_stddev", "Last ping test to management_server standard deviation")

# Speedtest iperf metrics
iperf_cluster_downlink = _edge_gauge("aetheredge_iperf_cluster_downlink_test", "Last iperf test downlink result")
# The help text used to read "downlink result" here as well (copy/paste slip)
iperf_cluster_uplink = _edge_gauge("aetheredge_iperf_cluster_uplink_test", "Last iperf test uplink result")

# Signal quality metrics in CESQ format not dB
# RSRQ: >=53 excellent, 43 ~ 53 good, 33 ~ 43 mid, <=33 bad, 0 no signal
# RSRP: >=20 excellent, 10 ~ 20 good, 0 ~ 10 mid, 0 no signal
signal_quality_rsrq = _edge_gauge("aetheredge_signal_quality_rsrq", "Quality of the received signal")
signal_quality_rsrp = _edge_gauge("aetheredge_signal_quality_rsrp", "Power of the received signal")

# Error counters reported by the agent, one gauge per counter
counters_dongle_read_error = _edge_gauge("aetheredge_counters_dongle_read_error", "Dongle read error counter")
counters_dongle_connect_error = _edge_gauge("aetheredge_counters_dongle_connect_error", "Dongle connect error counter")
counters_dongle_rsrp_rsrq_error = _edge_gauge("aetheredge_counters_dongle_rsrp_rsrq_error", "Dongle rsrp/rsrq error counter")
counters_modem_cfun0_error = _edge_gauge("aetheredge_counters_modem_cfun0_error", "Modem cfun0 error counter")
counters_modem_cfun1_error = _edge_gauge("aetheredge_counters_modem_cfun1_error", "Modem cfun1 error counter")
counters_modem_cgatt_error = _edge_gauge("aetheredge_counters_modem_cgatt_error", "Modem cgatt error counter")
counters_modem_cesq_error = _edge_gauge("aetheredge_counters_modem_cesq_error", "Modem cesq error counter")
counters_dry_run_ping_error = _edge_gauge("aetheredge_counters_dry_run_ping_error", "Dry run ping error counter")
counters_ping_error = _edge_gauge("aetheredge_counters_ping_error", "Ping error counter")
counters_iperf_error = _edge_gauge("aetheredge_counters_iperf_error", "Iperf error counter")
counters_report_send_error = _edge_gauge("aetheredge_counters_report_send_error", "Report send error counter")

# Other metrics
last_update = _edge_gauge("aetheredge_last_update", "Last reported test result")
maint_window = _edge_gauge("aetheredge_in_maintenance_window", "Currently in a maintenance window")
| 356 | |
def is_my_event(event, name):
    """Return True if a calendar event refers to the edge called *name*.

    The event's summary, location and description are searched for the edge
    name. Names starting with "ace-" are first suffixed with the monitored
    environment (AETHER_ENV). If that qualified name has an entry in
    room_mapping, the mapped text counts as a match too.

    Args:
        event: calendar event object; the three text attributes are read
            with getattr, so any of them may be absent.
        name: edge name as a string.

    Returns:
        True on the first field that matches, False when none does.
    """
    # The qualified name does not depend on the field, so compute it once.
    fullname = name
    if name.startswith("ace-"):
        fullname = "%s-%s" % (name, AETHER_ENV)

    for field in ("summary", "location", "description"):
        # A getattr default only covers a missing attribute. An attribute that
        # exists but holds None would make the "in" test raise TypeError, so
        # treat any empty value as an empty string.
        text = getattr(event, field, None) or ""
        if fullname in text:
            return True
        if fullname in room_mapping and room_mapping[fullname] in text:
            return True
    return False
| 367 | |
def is_naive_datetime(d):
    """Tell whether *d* is a naive datetime.

    A datetime is naive when it has no tzinfo at all, or when its tzinfo
    reports no UTC offset for it.
    """
    zone = d.tzinfo
    if zone is None:
        return True
    return zone.utcoffset(d) is None
| 370 | |
def process_all_day_events(es):
    """Give the naive start/end times of all-day events a US/Pacific zone.

    All-day events carry naive datetimes, which cannot be compared with
    timezone-aware ones. Each naive start or end is localized in place;
    events that are not all-day, and values that are already aware, are left
    untouched.
    """
    for event in es:
        if not event.all_day:
            continue
        pacific = pytz.timezone('US/Pacific')
        for attr in ("start", "end"):
            moment = getattr(event, attr)
            if is_naive_datetime(moment):
                setattr(event, attr, pacific.localize(moment))
| 380 | |
def in_maintenance_window(events, name, now):
    """Return True if some event is in progress at *now* and refers to *name*.

    An event is in progress when it started strictly before *now* and ends
    strictly after it. Only such events are matched against the edge name.
    """
    return any(
        event.start < now and event.end > now and is_my_event(event, name)
        for event in events
    )
| 387 | |
def pull_maintenance_events():
    """Poll the maintenance calendar forever and flag edges in a window.

    Once a minute the events from SECRET_ICAL_URL starting at the current UTC
    time are fetched, and every entry in ``edges`` gets its
    ``maintenance.in_window`` and ``maintenance.last_update`` fields refreshed.
    This function never returns; presumably it is meant to run on a
    background thread (confirm against the caller).
    """
    while True:
        now = datetime.datetime.now(pytz.utc)
        try:
            es = events(SECRET_ICAL_URL, start=now)
            process_all_day_events(es)
            # The per-edge update stays inside the try block on purpose: in a
            # try/except/else the else branch is not covered by the handler,
            # so one malformed event would otherwise end this loop for good.
            for edge in edges:
                maintenance = edge.setdefault('maintenance', {})
                maintenance['in_window'] = in_maintenance_window(es, edge['name'], now)
                maintenance['last_update'] = time.time()
        except Exception as e:
            # Same message as before, now with the traceback attached.
            app.logger.exception(e)
        time.sleep(60)
Andy Bavier | 4021a2f | 2020-07-29 12:39:47 -0700 | [diff] [blame] | 403 | |
def time_out_stale_results():
    """Reset every edge that has not reported within NO_RESULT_THRESHOLD.

    For a stale edge both plane statuses become "no result", the dongle stats
    are replaced by a failed-fetch marker, all ping and iperf results are
    zeroed, and the signal quality section is dropped.
    """
    def zeroed_ping():
        # A new dict per call so the ping targets never share one object.
        return {
            'transmitted': 0,
            'received': 0,
            'median': 0.0,
            'min': 0.0,
            'avg': 0.0,
            'max': 0.0,
            'stddev': 0.0,
        }

    for edge in edges:
        time_elapsed = time.time() - edge["last_update"]
        if not time_elapsed > NO_RESULT_THRESHOLD:
            continue

        status = edge['status']
        status['control_plane'] = "no result"
        status['user_plane'] = "no result"
        edge['dongle_stats'] = {'SuccessfulFetch': False}

        ping_results = edge['speedtest']['ping']
        for target in ('dry_run', 'dns', 'iperf_server', 'management_server'):
            ping_results[target] = zeroed_ping()

        edge['speedtest']['iperf'] = {
            'cluster': {'downlink': 0.0, 'uplink': 0.0},
        }
        edge.pop('signal_quality', None)
Andy Bavier | 4021a2f | 2020-07-29 12:39:47 -0700 | [diff] [blame] | 445 | |
def remove_edge_from_metrics(name):
    """Drop the series labelled *name* from every per-edge gauge.

    Removal is best-effort and independent per gauge: a gauge with no series
    for this edge is skipped and the remaining gauges are still processed.
    Previously one failure inside a group of removals skipped the rest of
    that group, and a bare ``except`` swallowed every kind of exception.

    Args:
        name: edge name, used as the value of the "name" label.
    """
    per_edge_gauges = (
        cp_status,
        up_status,
        last_update,
        e2e_tests_ok,
        connect_test_ok,
        ping_test_ok,
        e2e_tests_down,
        dongle_stats_imsi,
        dongle_stats_cellglobalid,
        dongle_stats_plmnstatus,
        dongle_stats_phycellid,
        ping_dry_run_min,
        ping_dry_run_avg,
        ping_dry_run_max,
        ping_dry_run_stddev,
        ping_dry_run_transmitted,
        ping_dry_run_received,
        ping_dry_run_median,
        ping_dns_min,
        ping_dns_avg,
        ping_dns_max,
        ping_dns_stddev,
        ping_dns_transmitted,
        ping_dns_received,
        ping_dns_median,
        ping_iperf_server_min,
        ping_iperf_server_avg,
        ping_iperf_server_max,
        ping_iperf_server_stddev,
        ping_iperf_server_transmitted,
        ping_iperf_server_received,
        ping_iperf_server_median,
        ping_management_server_min,
        ping_management_server_avg,
        ping_management_server_max,
        ping_management_server_stddev,
        ping_management_server_transmitted,
        ping_management_server_received,
        ping_management_server_median,
        iperf_cluster_downlink,
        iperf_cluster_uplink,
        signal_quality_rsrq,
        signal_quality_rsrp,
        counters_dongle_read_error,
        counters_dongle_connect_error,
        counters_dongle_rsrp_rsrq_error,
        counters_modem_cfun0_error,
        counters_modem_cfun1_error,
        counters_modem_cgatt_error,
        counters_modem_cesq_error,
        counters_dry_run_ping_error,
        counters_ping_error,
        counters_iperf_error,
        counters_report_send_error,
        maint_window,
    )
    for gauge in per_edge_gauges:
        try:
            gauge.remove(name)
        except KeyError:
            # NOTE(review): assumes prometheus_client signals "no series with
            # this label value" via KeyError - confirm for the pinned version.
            continue
Andy Bavier | 4021a2f | 2020-07-29 12:39:47 -0700 | [diff] [blame] | 541 | |
@app.route('/edges/metrics', methods=['GET'])
def get_prometheus_metrics():
    """Refresh the per-edge metrics and return them in Prometheus text format.

    Stale results are timed out first, then every edge except the
    "ace-example" placeholder has its labelled metrics updated from the
    stored record. The response body is the concatenation of
    ``prom.generate_latest()`` for each metric, in a fixed order.

    Returns:
        A ``text/plain`` Flask ``Response``.

    Raises:
        KeyError: if a stored edge lacks one of the mandatory speedtest,
            status or counter fields (only the dongle stats are optional).
    """
    time_out_stale_results()

    # (target, statistic, metric) triples. The order is significant: it is
    # both the update order and the order used when exporting.
    ping_metrics = (
        ('dry_run', 'min', ping_dry_run_min),
        ('dry_run', 'avg', ping_dry_run_avg),
        ('dry_run', 'max', ping_dry_run_max),
        ('dry_run', 'stddev', ping_dry_run_stddev),
        ('dry_run', 'transmitted', ping_dry_run_transmitted),
        ('dry_run', 'received', ping_dry_run_received),
        ('dry_run', 'median', ping_dry_run_median),
        ('dns', 'min', ping_dns_min),
        ('dns', 'avg', ping_dns_avg),
        ('dns', 'max', ping_dns_max),
        ('dns', 'stddev', ping_dns_stddev),
        ('dns', 'transmitted', ping_dns_transmitted),
        ('dns', 'received', ping_dns_received),
        ('dns', 'median', ping_dns_median),
        ('iperf_server', 'min', ping_iperf_server_min),
        ('iperf_server', 'avg', ping_iperf_server_avg),
        ('iperf_server', 'max', ping_iperf_server_max),
        ('iperf_server', 'stddev', ping_iperf_server_stddev),
        ('iperf_server', 'transmitted', ping_iperf_server_transmitted),
        ('iperf_server', 'received', ping_iperf_server_received),
        ('iperf_server', 'median', ping_iperf_server_median),
        ('management_server', 'min', ping_management_server_min),
        ('management_server', 'avg', ping_management_server_avg),
        ('management_server', 'max', ping_management_server_max),
        ('management_server', 'stddev', ping_management_server_stddev),
        ('management_server', 'transmitted', ping_management_server_transmitted),
        ('management_server', 'received', ping_management_server_received),
        ('management_server', 'median', ping_management_server_median),
    )
    # (direction, metric) pairs for the cluster iperf bandwidth results.
    iperf_metrics = (
        ('downlink', iperf_cluster_downlink),
        ('uplink', iperf_cluster_uplink),
    )
    # (counter key, metric) pairs for the agent error counters.
    counter_metrics = (
        ('dongle_read_error', counters_dongle_read_error),
        ('dongle_connect_error', counters_dongle_connect_error),
        ('dongle_rsrp_rsrq_error', counters_dongle_rsrp_rsrq_error),
        ('modem_cfun0_error', counters_modem_cfun0_error),
        ('modem_cfun1_error', counters_modem_cfun1_error),
        ('modem_cgatt_error', counters_modem_cgatt_error),
        ('modem_cesq_error', counters_modem_cesq_error),
        ('dry_run_ping_error', counters_dry_run_ping_error),
        ('ping_error', counters_ping_error),
        ('iperf_error', counters_iperf_error),
        ('report_send_error', counters_report_send_error),
    )
    # Dongle stats are best-effort: a missing key or an unparsable value must
    # not fail the scrape. Only lookup/conversion errors are swallowed, so
    # SystemExit and KeyboardInterrupt still propagate.
    optional_stat_errors = (KeyError, TypeError, ValueError, OverflowError)

    for edge in edges:
        name = edge['name']
        if name == "ace-example":
            continue

        connect_status = edge['status']['control_plane']
        ping_status = edge['status']['user_plane']

        # Add PLMN Status (only values known to plmnstatus_mapping)
        try:
            plmn = edge['dongle_stats']['PLMNStatus']
            if plmn and plmn in plmnstatus_mapping:
                dongle_stats_plmnstatus.labels(name).set(plmnstatus_mapping[plmn])
        except optional_stat_errors:
            pass

        # Add IMSI
        try:
            if edge['dongle_stats']['IMSI']:
                dongle_stats_imsi.labels(name).set(float(edge['dongle_stats']['IMSI']))
        except optional_stat_errors:
            pass

        # Add CellGlobalID (reported as a hexadecimal string)
        try:
            if edge['dongle_stats']['CellGlobalID']:
                dongle_stats_cellglobalid.labels(name).set(int(edge['dongle_stats']['CellGlobalID'], 16))
        except optional_stat_errors:
            pass

        # Add PhyCellID
        try:
            if edge['dongle_stats']['PhyCellID']:
                dongle_stats_phycellid.labels(name).set(edge['dongle_stats']['PhyCellID'])
        except optional_stat_errors:
            pass

        # Add ping latency results for every target
        for target, stat, metric in ping_metrics:
            metric.labels(name).set(edge['speedtest']['ping'][target][stat])

        # Add iperf bandwidth results
        for direction, metric in iperf_metrics:
            metric.labels(name).set(edge['speedtest']['iperf']['cluster'][direction])

        cp_status.labels(name).set(status_codes[connect_status])
        up_status.labels(name).set(status_codes[ping_status])

        last_update.labels(name).set(edge['last_update'])
        if 'maintenance' in edge:
            maint_window.labels(name).set(int(edge['maintenance']['in_window']))

        # Any "error"/"no result" status marks the edge as down and forces all
        # of the *_ok flags to 0, even if the other plane is "connected".
        down = (connect_status in ["error", "no result"]
                or ping_status in ["error", "no result"])
        connect_ok = not down and connect_status == "connected"
        ping_ok = not down and ping_status == "connected"
        connect_test_ok.labels(name).set(int(connect_ok))
        ping_test_ok.labels(name).set(int(ping_ok))
        e2e_tests_ok.labels(name).set(int(connect_ok and ping_ok))
        e2e_tests_down.labels(name).set(int(down))

        if 'signal_quality' in edge:
            signal_quality_rsrq.labels(name).set(edge['signal_quality']['rsrq'])
            signal_quality_rsrp.labels(name).set(edge['signal_quality']['rsrp'])

        if 'counters' in edge:
            for key, metric in counter_metrics:
                metric.labels(name).set(edge['counters'][key])

    # Export order is part of the response body, so keep it fixed.
    exported = [
        cp_status,
        up_status,
        dongle_stats_imsi,
        dongle_stats_cellglobalid,
        dongle_stats_plmnstatus,
        dongle_stats_phycellid,
    ]
    exported.extend(metric for _, _, metric in ping_metrics)
    exported.extend(metric for _, metric in iperf_metrics)
    exported.extend([
        last_update,
        maint_window,
        connect_test_ok,
        ping_test_ok,
        e2e_tests_ok,
        e2e_tests_down,
        signal_quality_rsrq,
        signal_quality_rsrp,
    ])
    exported.extend(metric for _, metric in counter_metrics)

    res = [prom.generate_latest(metric) for metric in exported]
    return Response(res, mimetype="text/plain")
| 725 | |
Hyunsun Moon | f32ae9a | 2020-05-28 13:17:45 -0700 | [diff] [blame] | 726 | |
@app.route('/edges/healthz', methods=['GET'])
def get_health():
    """Health-check endpoint: always answers with a fixed "healthy" message."""
    return dict(message='healthy')
| 730 | |
| 731 | |
@app.route('/edges', methods=['GET'])
def get_edges():
    """Return every known edge as JSON under the ``edges`` key.

    Stale results are timed out before the list is serialized.
    """
    time_out_stale_results()
    payload = {'edges': edges}
    return jsonify(payload)
| 736 | |
| 737 | |
@app.route('/edges/<string:name>', methods=['GET'])
def get_edge(name):
    """Return the edge called *name* as JSON under the ``edge`` key.

    Stale results are timed out first. Aborts with 404 when no edge with
    that name is stored; if several match, the first one is returned.
    """
    time_out_stale_results()
    match = next((candidate for candidate in edges if candidate['name'] == name), None)
    if match is None:
        abort(404)
    return jsonify({'edge': match})
| 745 | |
| 746 | |
def _default_ping_stats():
    """Return a fresh, zeroed result dict for a single ping target."""
    return {
        'transmitted': 0,
        'received': 0,
        'median': 0.0,
        'min': 0.0,
        'avg': 0.0,
        'max': 0.0,
        'stddev': 0.0
    }


@app.route('/edges', methods=['POST'])
@app.route('/testresults', methods=['POST'])
def create_or_update_edge():
    """Store the test results posted by an edge agent.

    The JSON body is validated against ``edgeSchema``; an invalid body is
    logged and rejected with 400. A record is then built from zeroed
    defaults, overlaid with whichever optional sections the request carries
    ('speedtest' ping/iperf, 'signal_quality', 'dongle_stats', 'counters'),
    and stamped with the current time. The record is appended to ``edges``
    when the name is new; otherwise the existing entry is updated in place.

    Returns:
        A ``({'edge': <record>}, 201)`` JSON response, for both the create
        and the update case.
    """
    try:
        jsonschema.validate(instance=request.json, schema=edgeSchema)
    except jsonschema.exceptions.ValidationError as err:
        # Logger.warn is a deprecated alias; use Logger.warning.
        app.logger.warning(err)
        abort(400)

    body = request.json
    ping_targets = ('dry_run', 'dns', 'iperf_server', 'management_server')
    counter_names = (
        'dongle_read_error',
        'dongle_connect_error',
        'dongle_rsrp_rsrq_error',
        'modem_cfun0_error',
        'modem_cfun1_error',
        'modem_cgatt_error',
        'modem_cesq_error',
        'dry_run_ping_error',
        'ping_error',
        'iperf_error',
        'report_send_error',
    )

    req_edge = {
        'name': body['name'],
        'status': {
            'control_plane': body['status']['control_plane'],
            'user_plane': body['status']['user_plane']
        },
        'dongle_stats': {
            'SuccessfulFetch': False
        },
        'speedtest': {
            # One independent zeroed dict per target (no shared references).
            'ping': {target: _default_ping_stats() for target in ping_targets},
            'iperf': {
                'cluster': {
                    'downlink': 0.0,
                    'uplink': 0.0
                }
            }
        },
        'counters': dict.fromkeys(counter_names, 0),
        'last_update': time.time()
    }

    # A section present in the request replaces the default wholesale.
    if 'speedtest' in body:
        for section in ('ping', 'iperf'):
            if section in body['speedtest']:
                req_edge['speedtest'][section] = body['speedtest'][section]

    for optional in ('signal_quality', 'dongle_stats', 'counters'):
        if optional in body:
            req_edge[optional] = body[optional]

    existing = next((known for known in edges if known['name'] == req_edge['name']), None)
    if existing is None:
        app.logger.info("new edge request " + req_edge['name'])
        edges.append(req_edge)
    else:
        existing['status']['control_plane'] = req_edge['status']['control_plane']
        existing['status']['user_plane'] = req_edge['status']['user_plane']
        existing['speedtest']['ping'] = req_edge['speedtest']['ping']
        existing['speedtest']['iperf'] = req_edge['speedtest']['iperf']
        existing['dongle_stats'] = req_edge['dongle_stats']
        # signal_quality has no default: keep the previous value when the
        # request does not carry one.
        if 'signal_quality' in req_edge:
            existing['signal_quality'] = req_edge['signal_quality']
        # 'counters' always exists in req_edge (defaults above).
        existing['counters'] = req_edge['counters']
        existing['last_update'] = req_edge['last_update']

    return jsonify({'edge': req_edge}), 201
| 859 | |
| 860 | |
@app.route('/edges/<string:name>', methods=['DELETE'])
@app.route('/testresults/<string:name>', methods=['DELETE'])
def delete_edge(name):
    """Delete the edge called *name* and drop its labelled metrics.

    Only the first stored edge with that name is removed. Aborts with 404
    when no such edge exists; otherwise answers ``{'result': True}``.
    """
    app.logger.info("delete edge request " + name)
    for position, candidate in enumerate(edges):
        if candidate['name'] == name:
            del edges[position]
            remove_edge_from_metrics(name)
            break
    else:
        # Loop finished without a match.
        abort(404)
    return jsonify({'result': True})
| 875 | |
| 876 | |
if __name__ == '__main__':
    # The maintenance-calendar poller is started only when both the calendar
    # URL and the Aether environment name are configured.
    if SECRET_ICAL_URL and AETHER_ENV:
        app.logger.info(" * Starting maintenance calendar polling thread (Aether env: %s)" % AETHER_ENV)
        threading.Thread(target=pull_maintenance_events).start()
    # NOTE(review): debug=True while listening on 0.0.0.0 exposes the
    # interactive debugger to any host that can reach port 80 -- confirm this
    # entry point is never used in production.
    app.run(debug=True, host='0.0.0.0', port=80)