# -*- coding: utf-8 -*-
"""The manager of monitor module."""
import os
from typing import Any, Optional, List, Union
from pathlib import Path
from loguru import logger
from sqlalchemy import Column, Integer, String, create_engine, text
from sqlalchemy.ext.declarative import declarative_base, DeclarativeMeta
from sqlalchemy.orm import sessionmaker
from ._file import FileManager
from ..utils.common import _is_windows
from ..constants import (
_DEFAULT_SQLITE_DB_NAME,
_DEFAULT_TABLE_NAME_FOR_CHAT_AND_EMBEDDING,
_DEFAULT_TABLE_NAME_FOR_IMAGE,
)
# Shared declarative base: the ORM table classes in this module inherit from
# it, and its metadata is used to create their tables in the monitor database.
_Base: DeclarativeMeta = declarative_base()
class _ModelTable(_Base):  # mypy: ignore
    """ORM table holding the invocation records of chat and embedding models.

    Every row carries the model name together with the prompt, completion
    and total token counts of a record.
    """

    __tablename__ = _DEFAULT_TABLE_NAME_FOR_CHAT_AND_EMBEDDING

    # Auto-incrementing integer primary key.
    id = Column(
        Integer,
        primary_key=True,
        autoincrement=True,
    )

    # Name of the invoked model (at most 50 characters).
    model_name = Column(String(50))

    # Token counters; each one defaults to 0 when not supplied.
    prompt_tokens = Column(Integer, default=0)
    completion_tokens = Column(Integer, default=0)
    total_tokens = Column(Integer, default=0)
class _ImageModelTable(_Base):
    """ORM table holding the invocation records of image models.

    Every row carries the model name, the requested resolution and the
    number of images of a record.
    """

    __tablename__ = _DEFAULT_TABLE_NAME_FOR_IMAGE

    # Auto-incrementing integer primary key.
    id = Column(
        Integer,
        primary_key=True,
        autoincrement=True,
    )

    # Name of the invoked model (at most 50 characters).
    model_name = Column(String(50))

    # Resolution of the generated images, stored as a string.
    # NOTE(review): the length 59 differs from the 50 used for model_name;
    # confirm that it is intentional.
    resolution = Column(String(59))

    # Number of images; defaults to 0 when not supplied.
    image_count = Column(Integer, default=0)
# [docs] (presumably a documentation-link marker left over from HTML extraction)
class MonitorManager:
    """The manager of monitor module.

    A singleton that records model invocations (token usage of chat and
    embedding models, image counts of image models) in a SQLite database
    stored in the run directory of the file manager, and reports the
    aggregated usage through two SQL views.
    """

    # The one and only instance; ``None`` until the class is instantiated.
    _instance = None

    def __new__(cls, *args: Any, **kwargs: Any) -> Any:
        """Create a singleton instance.

        Raises:
            `RuntimeError`: If an instance has already been created.
        """
        if cls._instance is None:
            cls._instance = super(MonitorManager, cls).__new__(
                cls,
            )
        else:
            raise RuntimeError(
                "The monitor manager has been initialized. Try to use "
                "MonitorManager.get_instance() to get the instance.",
            )
        return cls._instance

    @property
    def path_db(self) -> Union[str, None]:
        """The absolute path to the database, or `None` if the run directory
        of the file manager is not set."""
        run_dir = FileManager.get_instance().run_dir
        if run_dir is None:
            return None
        return os.path.abspath(os.path.join(run_dir, _DEFAULT_SQLITE_DB_NAME))

    def __init__(self) -> None:
        """Initialize the monitor manager in the disabled state."""
        self.use_monitor = False
        self.session = None
        self.engine = None

        # The name of the views
        self.view_chat_and_embedding = "view_chat_and_embedding"
        self.view_image = "view_image"

    def initialize(self, use_monitor: bool) -> None:
        """Initialize the monitor manager.

        Args:
            use_monitor (`bool`):
                Whether to use the monitor. When `True`, the monitor
                database is created.
        """
        self.use_monitor = use_monitor

        if use_monitor:
            self._create_monitor_db()

    @classmethod
    def get_instance(cls) -> "MonitorManager":
        """Get the instance of the singleton class.

        Raises:
            `ValueError`: If no instance has been created yet.
        """
        if cls._instance is None:
            raise ValueError(
                "AgentScope hasn't been initialized. Please call "
                "`agentscope.init` function first.",
            )
        return cls._instance

    def _print_table(self, title: str, usage: List) -> None:
        """Log the table data, one line per row with centred columns.

        Args:
            title (`str`):
                The title logged before the table.
            usage (`List`):
                The rows of the table; the first row is the header.
        """
        # TODO: use a better way to display the table data
        if len(usage) == 1:
            # Only the header is present: add a placeholder row of dashes.
            print_usage = usage + [["-"] * len(usage[0])]
        else:
            print_usage = usage

        # The width of every column is the length of its longest cell.
        max_len_col = [
            max(len(str(row[i])) for row in print_usage)
            for i in range(len(print_usage[0]))
        ]

        logger.info(title)
        for row in print_usage:
            cells = [
                str(cell).center(max_len + 2, " ")
                for cell, max_len in zip(row, max_len_col)
            ]
            # The empty strings at both ends produce the outer "|" borders.
            logger.info("|".join([""] + cells + [""]))

    def _create_monitor_db(self) -> None:
        """Create the database, its tables and the two usage views.

        Raises:
            `RuntimeError`: If the run directory of the file manager is not
                initialized.
        """
        # Read the property once; every access queries the file manager.
        path_db = self.path_db
        if path_db is None:
            raise RuntimeError(
                "The run_dir in file manager is not initialized.",
            )

        path = Path(os.path.abspath(path_db))

        # To avoid path error in windows, the URL prefix differs per platform
        if _is_windows():
            self.engine = create_engine(f"sqlite:///{str(path)}")
        else:
            self.engine = create_engine(f"sqlite:////{str(path)}")

        # Create tables
        _Base.metadata.create_all(self.engine)

        # ``begin()`` commits when the block exits without an error, so the
        # view definitions do not depend on implicit autocommit of DDL.
        with self.engine.begin() as connection:
            # Create view for chat and embedding models
            create_view_sql = text(
                f"""
                CREATE VIEW IF NOT EXISTS {self.view_chat_and_embedding} AS
                SELECT
                    model_name,
                    COUNT(*) AS times,
                    SUM(prompt_tokens) AS prompt_tokens,
                    SUM(completion_tokens) AS completion_tokens,
                    SUM(total_tokens) AS total_tokens
                FROM
                    {_ModelTable.__tablename__}
                GROUP BY
                    model_name;
                """,
            )
            connection.execute(create_view_sql)

            # Create view for text-to-image models
            create_view_sql = text(
                f"""
                CREATE VIEW IF NOT EXISTS {self.view_image} AS
                SELECT
                    model_name,
                    resolution,
                    COUNT(*) AS times,
                    SUM(image_count) AS image_count
                FROM
                    {_ImageModelTable.__tablename__}
                GROUP BY
                    model_name, resolution;
                """,
            )
            connection.execute(create_view_sql)

        self.session = sessionmaker(bind=self.engine)

    def _close_monitor_db(self) -> None:
        """Close the monitor database to avoid file occupation error in
        windows."""
        if self.session is not None:
            # NOTE(review): `close_all()` is deprecated in recent SQLAlchemy
            # releases in favour of `sqlalchemy.orm.close_all_sessions()`;
            # consider switching once the minimum supported version allows.
            self.session.close_all()

        if self.engine is not None:
            self.engine.dispose()

    def update_image_tokens(
        self,
        model_name: str,
        resolution: str,
        image_count: int,
    ) -> None:
        """Update the record of the image models.

        Does nothing when the monitor is disabled.

        Args:
            model_name (`str`):
                The name of the image model.
            resolution (`str`):
                The resolution of the generated images.
            image_count (`int`):
                The number of generated images.

        Raises:
            `RuntimeError`: If the monitor is enabled but the DB session is
                not initialized.
        """
        if not self.use_monitor:
            return

        if self.session is None:
            raise RuntimeError("The DB session in monitor is not initialized.")

        with self.session() as sess:
            new_record = _ImageModelTable(
                model_name=model_name,
                resolution=resolution,
                image_count=image_count,
            )
            sess.add(new_record)
            sess.commit()

    def update_text_and_embedding_tokens(
        self,
        model_name: str,
        prompt_tokens: int = 0,
        completion_tokens: int = 0,
        total_tokens: Optional[int] = None,
    ) -> None:
        """Update the tokens of a given model.

        Does nothing when the monitor is disabled.

        Args:
            model_name (`str`):
                The name of the chat or embedding model.
            prompt_tokens (`int`, defaults to `0`):
                The number of tokens in the prompt.
            completion_tokens (`int`, defaults to `0`):
                The number of tokens in the completion.
            total_tokens (`Optional[int]`, defaults to `None`):
                The total number of tokens. When given, it must equal
                `prompt_tokens + completion_tokens`; otherwise that sum is
                stored.

        Raises:
            `RuntimeError`: If the monitor is enabled but the DB session is
                not initialized.
            `AssertionError`: If `total_tokens` is given and does not equal
                `prompt_tokens + completion_tokens`.
        """
        if not self.use_monitor:
            return

        if self.session is None:
            raise RuntimeError("The DB session in monitor is not initialized.")

        expected_total = prompt_tokens + completion_tokens
        if total_tokens is not None:
            assert total_tokens == expected_total, (
                f"total_tokens ({total_tokens}) should equal prompt_tokens "
                f"+ completion_tokens ({expected_total})."
            )

        with self.session() as sess:
            new_record = _ModelTable(
                model_name=model_name,
                prompt_tokens=prompt_tokens,
                completion_tokens=completion_tokens,
                # Fall back to the computed sum when no total is supplied.
                total_tokens=total_tokens or expected_total,
            )
            sess.add(new_record)
            sess.commit()

    def print_llm_usage(self) -> dict:
        """Print the usage of all different model APIs.

        Returns:
            `dict`: The usage records under the keys `"text_and_embedding"`
            and `"image"`.
        """
        text_and_embedding = self.show_text_and_embedding_tokens()
        image = self.show_image_tokens()

        return {
            "text_and_embedding": text_and_embedding,
            "image": image,
        }

    def _fetch_view_rows(self, view_name: str) -> list:
        """Return all rows of the given view, or an empty list when the
        monitor is disabled."""
        if not self.use_monitor:
            return []

        with self.engine.connect() as connection:
            return connection.execute(
                text(f"SELECT * FROM {view_name}"),
            ).fetchall()

    def show_image_tokens(self) -> List[dict]:
        """Show the tokens of all image models.

        Returns:
            `List[dict]`: One dict per row of the image view with the keys
            `"model_name"`, `"resolution"`, `"times"` and `"image_count"`.
        """
        rows = self._fetch_view_rows(self.view_image)

        headers = [
            "MODEL NAME",
            "RESOLUTION",
            "TIMES",
            "IMAGE COUNT",
        ]
        self._print_table("Image Model:", [headers, *rows])

        return [
            {
                "model_name": row[0],
                "resolution": row[1],
                "times": row[2],
                "image_count": row[3],
            }
            for row in rows
        ]

    def show_text_and_embedding_tokens(self) -> List[dict]:
        """Show the tokens of all models.

        Returns:
            `List[dict]`: One dict per row of the chat and embedding view
            with the keys `"model_name"`, `"times"`, `"prompt_tokens"`,
            `"completion_tokens"` and `"total_tokens"`.
        """
        rows = self._fetch_view_rows(self.view_chat_and_embedding)

        headers = [
            "MODEL NAME",
            "TIMES",
            "PROMPT TOKENS",
            "COMPLETION TOKENS",
            "TOTAL TOKENS",
        ]
        self._print_table("Text & Embedding Model:", [headers, *rows])

        return [
            {
                "model_name": row[0],
                "times": row[1],
                "prompt_tokens": row[2],
                "completion_tokens": row[3],
                "total_tokens": row[4],
            }
            for row in rows
        ]

    def rm_database(self) -> None:
        """Remove the database file if it exists."""
        # Read the property once; every access queries the file manager.
        path_db = self.path_db
        if path_db is not None and os.path.exists(path_db):
            os.remove(path_db)

    def state_dict(self) -> dict:
        """Serialize the monitor manager into a dict."""
        return {
            "use_monitor": self.use_monitor,
            "path_db": self.path_db,
        }

    def load_dict(self, data: dict) -> None:
        """Load the monitor manager from a dict.

        Only the `"use_monitor"` key is read; the manager is re-initialized
        with its value.

        Args:
            data (`dict`):
                The serialized state; it must contain `"use_monitor"`.
        """
        assert "use_monitor" in data, "Key 'use_monitor' not found in data."
        self.initialize(data["use_monitor"])

    def flush(self) -> None:
        """Flush the monitor manager, i.e. close the database and reset the
        manager to its initial, disabled state."""
        # Close the database before flushing
        self._close_monitor_db()

        self.use_monitor = False
        self.session = None
        self.engine = None

        # The name of the views
        self.view_chat_and_embedding = "view_chat_and_embedding"
        self.view_image = "view_image"