|
import json |
|
import re |
|
from ast import literal_eval |
|
from typing import Any, List, Union |
|
|
|
|
|
class ParseError(Exception): |
|
"""Parsing exception class.""" |
|
|
|
def __init__(self, err_msg: str): |
|
self.err_msg = err_msg |
|
|
|
|
|
class BaseParser: |
|
"""Base parser to process inputs and outputs of actions. |
|
|
|
Args: |
|
action (:class:`BaseAction`): action to validate |
|
|
|
Attributes: |
|
PARAMETER_DESCRIPTION (:class:`str`): declare the input format which |
|
LLMs should follow when generating arguments for decided tools. |
|
""" |
|
|
|
PARAMETER_DESCRIPTION: str = '' |
|
|
|
def __init__(self, action): |
|
self.action = action |
|
self._api2param = {} |
|
self._api2required = {} |
|
|
|
if action.description: |
|
for api in action.description.get('api_list', |
|
[action.description]): |
|
name = (f'{action.name}.{api["name"]}' |
|
if self.action.is_toolkit else api['name']) |
|
required_parameters = set(api['required']) |
|
all_parameters = {j['name'] for j in api['parameters']} |
|
if not required_parameters.issubset(all_parameters): |
|
raise ValueError( |
|
f'unknown parameters for function "{name}": ' |
|
f'{required_parameters - all_parameters}') |
|
if self.PARAMETER_DESCRIPTION: |
|
api['parameter_description'] = self.PARAMETER_DESCRIPTION |
|
api_name = api['name'] if self.action.is_toolkit else 'run' |
|
self._api2param[api_name] = api['parameters'] |
|
self._api2required[api_name] = api['required'] |
|
|
|
def parse_inputs(self, inputs: str, name: str = 'run') -> dict: |
|
"""Parse inputs LLMs generate for the action. |
|
|
|
Args: |
|
inputs (:class:`str`): input string extracted from responses |
|
|
|
Returns: |
|
:class:`dict`: processed input |
|
""" |
|
inputs = {self._api2param[name][0]['name']: inputs} |
|
return inputs |
|
|
|
def parse_outputs(self, outputs: Any) -> List[dict]: |
|
"""Parser outputs returned by the action. |
|
|
|
Args: |
|
outputs (:class:`Any`): raw output of the action |
|
|
|
Returns: |
|
:class:`List[dict]`: processed output of which each member is a |
|
dictionary with two keys - 'type' and 'content'. |
|
""" |
|
if isinstance(outputs, dict): |
|
outputs = json.dumps(outputs, ensure_ascii=False) |
|
elif not isinstance(outputs, str): |
|
outputs = str(outputs) |
|
return [{ |
|
'type': 'text', |
|
'content': outputs.encode('gbk', 'ignore').decode('gbk') |
|
}] |
|
|
|
|
|
class JsonParser(BaseParser): |
|
"""Json parser to convert input string into a dictionary. |
|
|
|
Args: |
|
action (:class:`BaseAction`): action to validate |
|
""" |
|
|
|
PARAMETER_DESCRIPTION = ( |
|
'If you call this tool, you must pass arguments in ' |
|
'the JSON format {key: value}, where the key is the parameter name.') |
|
|
|
def parse_inputs(self, |
|
inputs: Union[str, dict], |
|
name: str = 'run') -> dict: |
|
if not isinstance(inputs, dict): |
|
try: |
|
match = re.search(r'^\s*(```json\n)?(.*)\n```\s*$', inputs, |
|
re.S) |
|
if match: |
|
inputs = match.group(2).strip() |
|
inputs = json.loads(inputs) |
|
except json.JSONDecodeError as exc: |
|
raise ParseError(f'invalid json format: {inputs}') from exc |
|
input_keys = set(inputs) |
|
all_keys = {param['name'] for param in self._api2param[name]} |
|
if not input_keys.issubset(all_keys): |
|
raise ParseError(f'unknown arguments: {input_keys - all_keys}') |
|
required_keys = set(self._api2required[name]) |
|
if not input_keys.issuperset(required_keys): |
|
raise ParseError( |
|
f'missing required arguments: {required_keys - input_keys}') |
|
return inputs |
|
|
|
|
|
class TupleParser(BaseParser): |
|
"""Tuple parser to convert input string into a tuple. |
|
|
|
Args: |
|
action (:class:`BaseAction`): action to validate |
|
""" |
|
|
|
PARAMETER_DESCRIPTION = ( |
|
'If you call this tool, you must pass arguments in the tuple format ' |
|
'like (arg1, arg2, arg3), and the arguments are ordered.') |
|
|
|
def parse_inputs(self, |
|
inputs: Union[str, tuple], |
|
name: str = 'run') -> dict: |
|
if not isinstance(inputs, tuple): |
|
try: |
|
inputs = literal_eval(inputs) |
|
except Exception as exc: |
|
raise ParseError(f'invalid tuple format: {inputs}') from exc |
|
if len(inputs) < len(self._api2required[name]): |
|
raise ParseError( |
|
f'API takes {len(self._api2required[name])} required positional ' |
|
f'arguments but {len(inputs)} were given') |
|
if len(inputs) > len(self._api2param[name]): |
|
raise ParseError( |
|
f'API takes {len(self._api2param[name])} positional arguments ' |
|
f'but {len(inputs)} were given') |
|
inputs = { |
|
self._api2param[name][i]['name']: item |
|
for i, item in enumerate(inputs) |
|
} |
|
return inputs |
|
|