Skip to content

Commit e42e7e6

Browse files
committed
update prom metrics
Signed-off-by: Praneeth Bedapudi <[email protected]>
1 parent e84f232 commit e42e7e6

File tree

4 files changed

+27
-23
lines changed

4 files changed

+27
-23
lines changed

fastdeploy/_loop.py

+15
Original file line numberDiff line numberDiff line change
@@ -186,6 +186,8 @@ def start_loop(
186186
"""
187187
)
188188

189+
prediction_loop_started_at = time.time()
190+
189191
while True:
190192
"""
191193
Set timedout_in_queue to True for all the predictions that have been in the queue for more than timeout_time seconds
@@ -226,9 +228,12 @@ def start_loop(
226228

227229
_utils.logger.debug(f"Processing batch {unique_id_wise_input_count}")
228230

231+
process_batch_started_at = time.time()
229232
results, last_predictor_success, received_at, predicted_at = process_batch(
230233
predictor, input_batch, optimal_batch_size
231234
)
235+
process_batch_ended_at = time.time()
236+
232237
unique_id_wise_results = prepare_results(
233238
unique_id_wise_input_count,
234239
results,
@@ -244,6 +249,16 @@ def start_loop(
244249
f"Updated results predictor {predictor_sequence}: {list(unique_id_wise_results)}"
245250
)
246251

252+
_utils.GLOBAL_METRICS_INDEX.math(
253+
"total_predictor_run_for_hours",
254+
(process_batch_ended_at - process_batch_started_at) / 3600,
255+
"+=",
256+
)
257+
258+
_utils.GLOBAL_METRICS_INDEX["total_predictor_up_for_hours"] = (
259+
time.time() - prediction_loop_started_at
260+
) / 3600
261+
247262

248263
if __name__ == "__main__":
249264
import sys

fastdeploy/_rest.py

+6-22
Original file line numberDiff line numberDiff line change
@@ -251,17 +251,13 @@ def on_get(self, req, resp):
251251
) / requests_received_in_last_x_seconds_that_are_successful
252252

253253
prometheus_text = f"""
254-
# HELP pending_requests The number of pending requests.
255-
# TYPE pending_requests gauge
256-
pending_requests {_utils.MAIN_INDEX.count(query={"-1.predicted_at": 0, "last_predictor_success": True})}
254+
# HELP total_predictor_run_for_hours Total hours the predictor has been actively running predictions since start.
255+
# TYPE total_predictor_run_for_hours counter
256+
total_predictor_run_for_hours {_utils.GLOBAL_METRICS_INDEX["total_predictor_run_for_hours"]}
257257
258-
# HELP failed_requests The number of failed requests.
259-
# TYPE failed_requests gauge
260-
failed_requests {_utils.MAIN_INDEX.count(query={"last_predictor_success": False})}
261-
262-
# HELP successful_requests The number of failed requests.
263-
# TYPE successful_requests gauge
264-
successful_requests {_utils.MAIN_INDEX.count(query={"-1.predicted_at": {"$ne": 0}, "last_predictor_success": True})}
258+
# HELP total_predictor_up_for_hours Total hours the predictor has been up since start.
259+
# TYPE total_predictor_up_for_hours counter
260+
total_predictor_up_for_hours {_utils.GLOBAL_METRICS_INDEX["total_predictor_up_for_hours"]}
265261
266262
# HELP requests_received_in_last_x_seconds The number of requests received in last {_LAST_X_SECONDS} seconds.
267263
# TYPE requests_received_in_last_x_seconds gauge
@@ -394,18 +390,6 @@ def on_get(self, req, resp):
394390
}
395391

396392

397-
class Failed(object):
398-
def on_get(self, req, resp):
399-
last_n_failed = int(req.params.get("last_n_failed", 10))
400-
failed_inputs = _utils.MAIN_INDEX.search(
401-
query={"last_predictor_success": False},
402-
n=last_n_failed,
403-
select_keys=["-1.inputs"],
404-
)
405-
406-
resp.media = failed_inputs
407-
408-
409393
app = falcon.App(
410394
middleware=falcon.CORSMiddleware(allow_origins="*", allow_credentials="*"),
411395
)

fastdeploy/_utils.py

+5
Original file line numberDiff line numberDiff line change
@@ -114,6 +114,11 @@
114114
MAIN_INDEX.optimize_for_query(["timedout_in_queue"])
115115

116116

117+
GLOBAL_METRICS_INDEX = KVIndex(os.path.join("fastdeploy_dbs", f"global_metrics_index.db"))
118+
GLOBAL_METRICS_INDEX["total_predictor_run_for_hours"] = 0
119+
GLOBAL_METRICS_INDEX["total_predictor_up_for_hours"] = 0
120+
121+
117122
def warmup(predictor, example_input, n=3):
118123
"""
119124
Run warmup prediction on the model.

setup.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
1919
AUTHOR = "BEDAPUDI PRANEETH"
2020
REQUIRES_PYTHON = ">=3.6.0"
21-
VERSION = "3.0.22"
21+
VERSION = "3.0.23"
2222

2323
# What packages are required for this module to be executed?
2424
REQUIRED = ["falcon", "liteindex==0.0.3.2.dev4", "zstandard", "gunicorn[gevent]", "msgpack"]

0 commit comments

Comments
 (0)