app-odoo/app_chatgpt/models/ai_robot.py

# -*- coding: utf-8 -*-
import openai.openai_object
import requests, json
import openai
from odoo import api, fields, models, _
from odoo.exceptions import UserError
from .lib.WordsSearch import WordsSearch

import logging
_logger = logging.getLogger(__name__)


class AiRobot(models.Model):
    _name = 'ai.robot'
    _description = 'Gpt Robot'
    _order = 'sequence, name'

    name = fields.Char(string='Name', translate=True, required=True)
    provider = fields.Selection(string="AI Provider", selection=[('openai', 'OpenAI'), ('azure', 'Azure')], required=True, default='openai')
    ai_model = fields.Selection(string="AI Model", selection=[
        ('gpt-4', 'Chatgpt 4'),
        ('gpt-3.5-turbo', 'Chatgpt 3.5 Turbo'),
        ('gpt-3.5-turbo-0301', 'Chatgpt 3.5 Turbo on 20230301'),
        ('text-davinci-003', 'Chatgpt 3 Davinci'),
        ('code-davinci-002', 'Chatgpt 2 Code Optimized'),
        ('text-davinci-002', 'Chatgpt 2 Davinci'),
        ('dall-e2', 'Dall-E Image'),
    ], required=True, default='gpt-3.5-turbo',
                             help="""
GPT-4: Can understand Image, generate natural language or code.
GPT-3.5: A set of models that improve on GPT-3 and can understand as well as generate natural language or code
DALL·E: A model that can generate and edit images given a natural language prompt
Whisper: A model that can convert audio into text
Embeddings:	A set of models that can convert text into a numerical form
CodexLimited: A set of models that can understand and generate code, including translating natural language to code
Moderation: A fine-tuned model that can detect whether text may be sensitive or unsafe
GPT-3	A set of models that can understand and generate natural language
                             """)
    openapi_api_key = fields.Char(string="API Key", help="Provide the API key here")
    # begin gpt 参数
    # 1. stop：表示聊天机器人停止生成回复的条件，可以是一段文本或者一个列表，当聊天机器人生成的回复中包含了这个条件，就会停止继续生成回复。
    # 2. temperature：控制回复的“新颖度”，值越高，聊天机器人生成的回复越不确定和随机，值越低，聊天机器人生成的回复会更加可预测和常规化。
    # 3. top_p：与temperature有些类似，也是控制回复的“新颖度”。不同的是，top_p控制的是回复中概率最高的几个可能性的累计概率之和，值越小，生成的回复越保守，值越大，生成的回复越新颖。
    # 4. frequency_penalty：用于控制聊天机器人回复中出现频率过高的词汇的惩罚程度。聊天机器人会尝试避免在回复中使用频率较高的词汇，以提高回复的多样性和新颖度。
    # 5. presence_penalty：与frequency_penalty相对，用于控制聊天机器人回复中出现频率较低的词汇的惩罚程度。聊天机器人会尝试在回复中使用频率较低的词汇，以提高回复的多样性和新颖度。
    max_tokens = fields.Integer('Max response', default=600,
                                help="""
                                Set a limit on the number of tokens per model response.
                                The API supports a maximum of 4000 tokens shared between the prompt
                                (including system message, examples, message history, and user query) and the model's response.
                                One token is roughly 4 characters for typical English text.
                                """)
    temperature = fields.Float(string='Temperature', default=0.9,
                               help="""
                               Controls randomness. Lowering the temperature means that the model will produce
                               more repetitive and deterministic responses.
                               Increasing the temperature will result in more unexpected or creative responses.
                               Try adjusting temperature or Top P but not both.
                                    """)
    top_p = fields.Float('Top probabilities', default=0.6,
                         help="""
                         Similar to temperature, this controls randomness but uses a different method.
                         Lowering Top P will narrow the model’s token selection to likelier tokens.
                         Increasing Top P will let the model choose from tokens with both high and low likelihood.
                         Try adjusting temperature or Top P but not both
                         """)
    # 避免使用常用词
    frequency_penalty = fields.Float('Frequency penalty', default=0.5,
                                     help="""
                                     Reduce the chance of repeating a token proportionally based on how often it has appeared in the text so far.
                                     This decreases the likelihood of repeating the exact same text in a response.
                                     """)
    # 越大模型就趋向于生成更新的话题，惩罚已经出现过的文本
    presence_penalty = fields.Float('Presence penalty', default=0.5,
                                    help="""
                                    Reduce the chance of repeating any token that has appeared in the text at all so far.
                                    This increases the likelihood of introducing new topics in a response.
                                    """)
    # 停止回复的关键词
    stop = fields.Char('Stop sequences',
                       help="""
                       Use , to separate the stop key word.
                       Make responses stop at a desired point, such as the end of a sentence or list.
                       Specify up to four sequences where the model will stop generating further tokens in a response.
                       The returned text will not contain the stop sequence.
                       """)
    # 角色设定
    sys_content = fields.Char('System message',
                              help="""
                              Give the model instructions about how it should behave and any context it should reference when generating a response.
                              You can describe the assistant’s personality,
                              tell it what it should and shouldn’t answer, and tell it how to format responses.
                              There’s no token limit for this section, but it will be included with every API call,
                              so it counts against the overall token limit.
                              """)
    # end gpt 参数
    endpoint = fields.Char('End Point', default='https://api.openai.com/v1/chat/completions')
    engine = fields.Char('Engine', help='If use Azure, Please input the Model deployment name.')
    api_version = fields.Char('API Version', default='2022-12-01')
    ai_timeout = fields.Integer('Timeout(seconds)', help="Connect timeout for Ai response", default=120)
    sequence = fields.Integer('Sequence', help="Determine the display order", default=10)
    sensitive_words = fields.Text('Sensitive Words Plus', help='Sensitive word filtering. Separate keywords with a carriage return.')
    is_filtering = fields.Boolean('Filter Sensitive Words', default=False, help='Use base Filter in dir models/lib/sensi_words.txt')

    def action_disconnect(self):
        requests.delete('https://chatgpt.com/v1/disconnect')

    def get_ai(self, data, author_id=False, answer_id=False, **kwargs):
        #     通用方法
        # author_id: 请求的 partner_id 对象
        # answer_id: 回答的 partner_id 对象
        # kwargs，dict 形式的可变参数
        self.ensure_one()
        # 前置勾子，一般返回 False，有问题返回响应内容
        res_pre = self.get_ai_pre(data, author_id, answer_id, **kwargs)
        if res_pre:
            return res_pre
        if hasattr(self, 'get_%s' % self.provider):
            res = getattr(self, 'get_%s' % self.provider)(data, author_id, answer_id, **kwargs)
        else:
            res = _('No robot provider found')

        # 后置勾子，返回处理后的内容，用于处理敏感词等
        res_post = self.get_ai_post(res, author_id, answer_id, **kwargs)
        return res_post

    def get_ai_pre(self, data, author_id=False, answer_id=False, **kwargs):
        search = WordsSearch()
        search.SetKeywords([])
        content = data[0]['content']
        sensi = search.FindFirst(content)
        if sensi is not None:
            return _('温馨提示：您发送的内容含有敏感词，请修改内容后再向我发送。')
        else:
            return False

    def get_ai_post(self, res, author_id=False, answer_id=False, **kwargs):
        if res and author_id and isinstance(res, openai.openai_object.OpenAIObject) or isinstance(res, list):
            usage = json.loads(json.dumps(res['usage']))
            content = json.loads(json.dumps(res['choices'][0]['message']['content']))
            data = content.replace(' .', '.').strip()
            if usage:
                # todo: 不是写到 user ，是要写到指定 m2m 相关模型， 如：  res.partner.ai.use
                user_id = author_id.mapped('user_ids')[:1]
                prompt_tokens = usage['prompt_tokens']
                completion_tokens = usage['completion_tokens']
                total_tokens = usage['total_tokens']
                vals = {
                    'human_prompt_tokens': user_id.human_prompt_tokens + prompt_tokens,
                    'ai_completion_tokens': user_id.ai_completion_tokens + completion_tokens,
                    'tokens_total': user_id.tokens_total + total_tokens,
                    'used_number': user_id.used_number + 1,
                }
                if not user_id.first_ask_time:
                    ask_date = fields.Datetime.now()
                    vals.update({
                        'first_ask_time': ask_date
                    })
                user_id.write(vals)
            # res = self.filter_sensitive_words(data)
        else:
            data = res
        return data

    def get_ai_system(self, content=None):
        # 获取基础ai角色设定, role system
        sys_content = content or self.sys_content
        if sys_content:
            return {"role": "system", "content": sys_content}
        return {}

    def get_ai_model_info(self):
        self.ensure_one()
        headers = {"Content-Type": "application/json", "Authorization": f"Bearer {self.openapi_api_key}"}
        R_TIMEOUT = self.ai_timeout or 120
        o_url = "https://api.openai.com/v1/models/%s" % self.ai_model
        if self.endpoint:
            o_url = self.endpoint.replace("/chat/completions", "") + "/models/%s" % self.ai_model

        response = requests.get(o_url, headers=headers, timeout=R_TIMEOUT)
        response.close()
        if response:
            res = response.json()
            r_text = json.dumps(res, indent=2)
        else:
            r_text = 'No response.'
        raise UserError(r_text)

    def get_ai_list_model(self):
        self.ensure_one()
        headers = {"Content-Type": "application/json", "Authorization": f"Bearer {self.openapi_api_key}"}
        R_TIMEOUT = self.ai_timeout or 120
        o_url = "https://api.openai.com/v1/models"
        if self.endpoint:
            o_url = self.endpoint.replace("/chat/completions", "") + "/models"
        response = requests.get(o_url, headers=headers, timeout=R_TIMEOUT)
        response.close()
        if response:
            res = response.json()
            r_text = json.dumps(res, indent=2)
        else:
            r_text = 'No response.'
        raise UserError(r_text)

    def get_openai(self, data, author_id, answer_id, **kwargs):
        self.ensure_one()
        headers = {"Content-Type": "application/json", "Authorization": f"Bearer {self.openapi_api_key}"}
        R_TIMEOUT = self.ai_timeout or 120
        o_url = self.endpoint or "https://api.openai.com/v1/chat/completions"

        if self.stop:
            stop = self.stop.split(',')
        else:
            stop = ["Human:", "AI:"]
        # 以下处理 open ai
        if self.ai_model in ['gpt-3.5-turbo', 'gpt-3.5-turbo-0301']:
            # 基本与 azure 同，要处理 api_base
            openai.api_key = self.openapi_api_key
            openai.api_base = o_url.replace('/chat/completions', '')
            if isinstance(data, list):
                messages = data
            else:
                messages = [{"role": "user", "content": data}]
            # Ai角色设定
            sys_content = self.get_ai_system(kwargs.get('sys_content'))
            if sys_content:
                messages.insert(0, sys_content)
            response = openai.ChatCompletion.create(
                model=self.ai_model,
                messages=messages,
                n=1,
                temperature=self.temperature or 0.9,
                max_tokens=self.max_tokens or 600,
                top_p=self.top_p or 0.6,
                frequency_penalty=self.frequency_penalty or 0.5,
                presence_penalty=self.presence_penalty or 0.5,
                stop=stop,
                request_timeout=self.ai_timeout or 120,
            )
            if 'choices' in response:
                return response
            else:
                _logger.warning('=====================Openai output data: %s' % response)
        elif self.ai_model == 'dall-e2':
            # todo: 处理 图像引擎，主要是返回参数到聊天中
            # image_url = response['data'][0]['url']
            # https://platform.openai.com/docs/guides/images/introduction
            pdata = {
                "prompt": data,
                "n": 3,
                "size": "1024x1024",
            }
            return '建设中'
        else:
            pdata = {
                "model": self.ai_model,
                "prompt": data,
                "temperature": 0.9,
                "max_tokens": self.max_tokens or 1000,
                "top_p": 1,
                "frequency_penalty": 0.0,
                "presence_penalty": 0.6,
                "stop": ["Human:", "AI:"]
            }
            response = requests.post(o_url, data=json.dumps(pdata), headers=headers, timeout=R_TIMEOUT)
            res = response.json()
            if 'choices' in res:
                res = '\n'.join([x['text'] for x in res['choices']])
                return res

        return _("Response Timeout, please speak again.")

    def get_azure(self, data, author_id, answer_id, **kwargs):
        self.ensure_one()
        # only for azure
        openai.api_type = self.provider
        if not self.endpoint:
            raise UserError(_("Please Set your AI robot's endpoint first."))
        openai.api_base = self.endpoint
        if not self.api_version:
            raise UserError(_("Please Set your AI robot's API Version first."))
        openai.api_version = self.api_version
        openai.api_key = self.openapi_api_key
        if self.stop:
            stop = self.stop.split(',')
        else:
            stop = ["Human:", "AI:"]
        if isinstance(data, list):
            messages = data
        else:
            messages = [{"role": "user", "content": data}]
        # Ai角色设定
        sys_content = self.get_ai_system(kwargs.get('sys_content'))
        if sys_content:
            messages.insert(0, sys_content)
        response = openai.ChatCompletion.create(
            engine=self.engine,
            messages=messages,
            # 返回的回答数量
            n=1,
            temperature=self.temperature or 0.9,
            max_tokens=self.max_tokens or 600,
            top_p=self.top_p or 0.6,
            frequency_penalty=self.frequency_penalty or 0.5,
            presence_penalty=self.presence_penalty or 0.5,
            stop=stop,
            request_timeout=self.ai_timeout or 120,
        )
        if 'choices' in response:
            return response
        else:
            _logger.warning('=====================azure output data: %s' % response)
        return _("Response Timeout, please speak again.")

    @api.onchange('provider')
    def _onchange_provider(self):
        if self.provider == 'openai':
            self.endpoint = 'https://api.openai.com/v1/chat/completions'
        elif self.provider == 'azure':
            self.endpoint = 'https://odoo.openai.azure.com'

    def filter_sensitive_words(self, data):
        if self.is_filtering:
            search = WordsSearch()
            s = self.sensitive_words
            if s:
                search.SetKeywords(s.split('\n'))
            else:
                search.SetKeywords([])
            data = search.Replace(text=data)
            return data
        else:
            return data