Compare commits

..

2 Commits

Author SHA1 Message Date
Abiola Akinnubi 74efc2cb42 bump up version minor number 2025-11-14 18:07:17 -08:00
Abiola Akinnubi db3096bbaf feat AUTO-695: add loaded_at attribute to AutoScalerData and Metrics classes 2025-11-14 17:07:06 -08:00
3 changed files with 3 additions and 4 deletions
+1 -1
View File
@@ -30,7 +30,7 @@ from lib.data_types import (
BenchmarkResult
)
-VERSION = "0.2.0"
+VERSION = "0.2.1"
MSG_HISTORY_LEN = 100
log = logging.getLogger(__file__)
+1 -1
View File
@@ -146,6 +146,7 @@ class Metrics:
def _set_mtoken(self, mtoken: str) -> None:
self.mtoken = mtoken
#######################################Private#######################################
async def __send_delete_requests_and_reset(self):
@@ -280,7 +281,6 @@ class Metrics:
if sent:
# clear the one-shot loadtime only if we actually sent *this* value
self.system_metrics.reset(expected=loadtime_snapshot)
self.update_pending = False
self.model_metrics.reset()
self.last_metric_update = time.time()
-1
View File
@@ -11,7 +11,6 @@ MODEL_SERVER_START_LOG_MSG = [
"llama runner started", # Ollama
'"message":"Connected","target":"text_generation_router"', # TGI
'"message":"Connected","target":"text_generation_router::server"', # TGI
"main: model loaded" # llama.cpp
]
MODEL_SERVER_ERROR_LOG_MSGS = [