|
import time
|
|
|
|
from pydantic import BaseModel, Field
|
|
|
|
|
|
class Cost(BaseModel):
|
|
model: str
|
|
cost: float
|
|
timestamp: float = Field(default_factory=time.time)
|
|
|
|
|
|
class ResponseLatency(BaseModel):
|
|
"""Metric tracking the round-trip time per completion call."""
|
|
|
|
model: str
|
|
latency: float
|
|
response_id: str
|
|
|
|
|
|
class Metrics:
|
|
"""Metrics class can record various metrics during running and evaluation.
|
|
Currently, we define the following metrics:
|
|
accumulated_cost: the total cost (USD $) of the current LLM.
|
|
response_latency: the time taken for each LLM completion call.
|
|
"""
|
|
|
|
def __init__(self, model_name: str = 'default') -> None:
|
|
self._accumulated_cost: float = 0.0
|
|
self._costs: list[Cost] = []
|
|
self._response_latencies: list[ResponseLatency] = []
|
|
self.model_name = model_name
|
|
|
|
@property
|
|
def accumulated_cost(self) -> float:
|
|
return self._accumulated_cost
|
|
|
|
@accumulated_cost.setter
|
|
def accumulated_cost(self, value: float) -> None:
|
|
if value < 0:
|
|
raise ValueError('Total cost cannot be negative.')
|
|
self._accumulated_cost = value
|
|
|
|
@property
|
|
def costs(self) -> list[Cost]:
|
|
return self._costs
|
|
|
|
@property
|
|
def response_latencies(self) -> list[ResponseLatency]:
|
|
if not hasattr(self, '_response_latencies'):
|
|
self._response_latencies = []
|
|
return self._response_latencies
|
|
|
|
@response_latencies.setter
|
|
def response_latencies(self, value: list[ResponseLatency]) -> None:
|
|
self._response_latencies = value
|
|
|
|
def add_cost(self, value: float) -> None:
|
|
if value < 0:
|
|
raise ValueError('Added cost cannot be negative.')
|
|
self._accumulated_cost += value
|
|
self._costs.append(Cost(cost=value, model=self.model_name))
|
|
|
|
def add_response_latency(self, value: float, response_id: str) -> None:
|
|
self._response_latencies.append(
|
|
ResponseLatency(
|
|
latency=max(0.0, value), model=self.model_name, response_id=response_id
|
|
)
|
|
)
|
|
|
|
def merge(self, other: 'Metrics') -> None:
|
|
self._accumulated_cost += other.accumulated_cost
|
|
self._costs += other._costs
|
|
self._response_latencies += other._response_latencies
|
|
|
|
def get(self) -> dict:
|
|
"""Return the metrics in a dictionary."""
|
|
return {
|
|
'accumulated_cost': self._accumulated_cost,
|
|
'costs': [cost.model_dump() for cost in self._costs],
|
|
'response_latencies': [
|
|
latency.model_dump() for latency in self._response_latencies
|
|
],
|
|
}
|
|
|
|
def reset(self):
|
|
self._accumulated_cost = 0.0
|
|
self._costs = []
|
|
self._response_latencies = []
|
|
|
|
def log(self):
|
|
"""Log the metrics."""
|
|
metrics = self.get()
|
|
logs = ''
|
|
for key, value in metrics.items():
|
|
logs += f'{key}: {value}\n'
|
|
return logs
|
|
|
|
def __repr__(self):
|
|
return f'Metrics({self.get()}'
|
|
|