MetaGPT/metagpt/provider/zhipuai_api.py at a87b5056d707c4efde11104768ff9c0702dbed9f · springasa/MetaGPT · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# @Desc   : zhipuai LLM from https://open.bigmodel.cn/dev/api#sdk

import json
from enum import Enum

import openai
import zhipuai
from requests import ConnectionError
from tenacity import (
    after_log,
    retry,
    retry_if_exception_type,
    stop_after_attempt,
    wait_random_exponential,
)

from metagpt.config import CONFIG, LLMProviderEnum
from metagpt.logs import log_llm_stream, logger
from metagpt.provider.base_gpt_api import BaseGPTAPI
from metagpt.provider.llm_provider_registry import register_provider
from metagpt.provider.openai_api import CostManager, log_and_reraise
from metagpt.provider.zhipuai.zhipu_model_api import ZhiPuModelAPI


class ZhiPuEvent(Enum):
    """Event names compared against ``event.event`` while reading the ZhiPuAI stream.

    The values are the raw strings matched in
    ``ZhiPuAIGPTAPI._achat_completion_stream``.
    """

    ADD = "add"  # event.data is a content chunk that is collected and streamed to the log
    ERROR = "error"  # event.data is reported through logger.error
    INTERRUPTED = "interrupted"  # handled by the same branch as ERROR
    FINISH = "finish"  # event.meta is parsed as JSON and its "usage" entry is read


@register_provider(LLMProviderEnum.ZHIPUAI)
class ZhiPuAIGPTAPI(BaseGPTAPI):
    """LLM provider that talks to ZhiPuAI through ``ZhiPuModelAPI``.

    Refs to `https://open.bigmodel.cn/dev/api#chatglm_turbo`
    For now there is only one model, named `chatglm_turbo`.
    """

    use_system_prompt: bool = False  # zhipuai has no system prompt when using the api

    def __init__(self):
        """Configure the SDK credentials and set the model and cost tracker."""
        self.__init_zhipuai(CONFIG)
        # The class itself (not an instance) is stored; invoke/ainvoke/asse_invoke
        # are called directly on it.
        self.llm = ZhiPuModelAPI
        self.model = "chatglm_turbo"  # so far only one model, just use it
        self._cost_manager = CostManager()

    def __init_zhipuai(self, config: CONFIG):
        """Copy the API key (and optional proxy) from ``config`` into the SDK modules.

        Raises:
            AssertionError: if ``config.zhipuai_api_key`` is empty.
        """
        # Raised explicitly (instead of a bare ``assert``) so the check also
        # runs under ``python -O``; the exception type is unchanged.
        if not config.zhipuai_api_key:
            raise AssertionError("zhipuai_api_key is not configured")
        zhipuai.api_key = config.zhipuai_api_key
        # The openai sdk is used underneath, so its api_key is set too, but it won't be used.
        openai.api_key = zhipuai.api_key
        if config.openai_proxy:
            openai.proxy = config.openai_proxy

    def _const_kwargs(self, messages: list[dict]) -> dict:
        """Build the keyword arguments passed to every ``self.llm`` call."""
        return {"model": self.model, "prompt": messages, "temperature": 0.3}

    @staticmethod
    def _extract_usage(resp: dict) -> dict:
        """Return the ``usage`` mapping nested under ``resp["data"]``, or ``{}`` if absent."""
        # A response without "data" (or with a null one) must not crash the
        # cost bookkeeping; get_choice_text reports such responses instead.
        return (resp.get("data") or {}).get("usage") or {}

    def _update_costs(self, usage: dict):
        """Update the cost manager with the token counts of one request.

        Does nothing unless ``CONFIG.calc_usage`` is truthy. Failures are logged
        and swallowed so that bookkeeping never breaks a completion call.
        """
        if not CONFIG.calc_usage:
            return
        try:
            prompt_tokens = int(usage.get("prompt_tokens", 0))
            completion_tokens = int(usage.get("completion_tokens", 0))
            self._cost_manager.update_cost(prompt_tokens, completion_tokens, self.model)
        except Exception as e:
            logger.error(f"zhipuai updats costs failed! exp: {e}")

    def get_choice_text(self, resp: dict) -> str:
        """Return the content of the last entry of ``resp["data"]["choices"]``.

        Raises:
            AssertionError: if there is no choice or the last choice's role is
                not ``"assistant"``.
        """
        choices = (resp.get("data") or {}).get("choices")
        # Missing or empty choices are treated like an explicit error entry
        # rather than failing with an IndexError.
        assist_msg = choices[-1] if choices else {"role": "error"}
        if assist_msg.get("role") != "assistant":
            raise AssertionError(f"unexpected zhipuai response: {resp}")
        return assist_msg.get("content")

    def completion(self, messages: list[dict]) -> dict:
        """Call ``self.llm.invoke`` synchronously, record usage and return the raw response."""
        resp = self.llm.invoke(**self._const_kwargs(messages))
        self._update_costs(self._extract_usage(resp))
        return resp

    async def _achat_completion(self, messages: list[dict]) -> dict:
        """Await ``self.llm.ainvoke``, record usage and return the raw response."""
        resp = await self.llm.ainvoke(**self._const_kwargs(messages))
        self._update_costs(self._extract_usage(resp))
        return resp

    async def acompletion(self, messages: list[dict]) -> dict:
        """Async counterpart of ``completion``; returns the raw response."""
        return await self._achat_completion(messages)

    async def _achat_completion_stream(self, messages: list[dict]) -> str:
        """Consume the event stream from ``self.llm.asse_invoke`` and return the joined text.

        Content of ``add`` events is forwarded to ``log_llm_stream`` as it
        arrives. Content of ``error`` / ``interrupted`` events is logged as an
        error and also kept in the returned text. Usage is read from the
        ``finish`` event's meta and passed to ``_update_costs``.
        """
        response = await self.llm.asse_invoke(**self._const_kwargs(messages))
        collected_content = []
        usage = {}
        failure_events = (ZhiPuEvent.ERROR.value, ZhiPuEvent.INTERRUPTED.value)
        async for event in response.async_events():
            if event.event == ZhiPuEvent.ADD.value:
                content = event.data
                collected_content.append(content)
                log_llm_stream(content)
            elif event.event in failure_events:
                content = event.data
                # No extra kwargs here: the logger looks like loguru, which would
                # run str.format on the message and choke on braces in the payload.
                logger.error(f"event error: {content}")
                # Append the text itself (not a list) so the final join works.
                collected_content.append(content)
            elif event.event == ZhiPuEvent.FINISH.value:
                # event.meta is a JSON string shaped like:
                #     {
                #         "task_status":"SUCCESS",
                #         "usage":{
                #             "completion_tokens":351,
                #             "prompt_tokens":595,
                #             "total_tokens":946
                #         },
                #         "task_id":"xx",
                #         "request_id":"xxx"
                #     }
                meta = json.loads(event.meta)
                usage = meta.get("usage") or {}
            else:
                logger.warning(f"zhipuapi else event: {event.data}")

        self._update_costs(usage)
        return "".join(collected_content)

    @retry(
        stop=stop_after_attempt(3),
        wait=wait_random_exponential(min=1, max=60),
        after=after_log(logger, logger.level("WARNING").name),
        retry=retry_if_exception_type(ConnectionError),
        retry_error_callback=log_and_reraise,
    )
    async def acompletion_text(self, messages: list[dict], stream=False) -> str:
        """Return the completion text, in streaming or non-streaming mode.

        Retried on ``ConnectionError`` for at most 3 attempts, with a randomized
        exponential wait; ``log_and_reraise`` is the callback used once the
        attempts are exhausted.
        """
        if stream:
            return await self._achat_completion_stream(messages)
        resp = await self._achat_completion(messages)
        return self.get_choice_text(resp)