浏览代码

chore: make prompt generator max tokens configurable (#6693)

tags/0.6.16
Sangmin Ahn 1年前
父节点
当前提交
ecb9c311b5
没有帐户链接到提交者的电子邮件
共有 3 个文件被更改,包括 8 次插入和 3 次删除
  1. 1
    0
      api/.env.example
  2. 5
    1
      api/controllers/console/app/generator.py
  3. 2
    2
      api/core/llm_generator/llm_generator.py

+ 1
- 0
api/.env.example 查看文件



# Model Configuration # Model Configuration
MULTIMODAL_SEND_IMAGE_FORMAT=base64 MULTIMODAL_SEND_IMAGE_FORMAT=base64
PROMPT_GENERATION_MAX_TOKENS=512


# Mail configuration, support: resend, smtp # Mail configuration, support: resend, smtp
MAIL_TYPE= MAIL_TYPE=

+ 5
- 1
api/controllers/console/app/generator.py 查看文件

import os

from flask_login import current_user from flask_login import current_user
from flask_restful import Resource, reqparse from flask_restful import Resource, reqparse


args = parser.parse_args() args = parser.parse_args()


account = current_user account = current_user
PROMPT_GENERATION_MAX_TOKENS = int(os.getenv('PROMPT_GENERATION_MAX_TOKENS', '512'))


try: try:
rules = LLMGenerator.generate_rule_config( rules = LLMGenerator.generate_rule_config(
tenant_id=account.current_tenant_id, tenant_id=account.current_tenant_id,
instruction=args['instruction'], instruction=args['instruction'],
model_config=args['model_config'], model_config=args['model_config'],
no_variable=args['no_variable']
no_variable=args['no_variable'],
rule_config_max_tokens=PROMPT_GENERATION_MAX_TOKENS
) )
except ProviderTokenNotInitError as ex: except ProviderTokenNotInitError as ex:
raise ProviderNotInitializeError(ex.description) raise ProviderNotInitializeError(ex.description)

+ 2
- 2
api/core/llm_generator/llm_generator.py 查看文件

return questions return questions


@classmethod @classmethod
def generate_rule_config(cls, tenant_id: str, instruction: str, model_config: dict, no_variable: bool) -> dict:
def generate_rule_config(cls, tenant_id: str, instruction: str, model_config: dict, no_variable: bool, rule_config_max_tokens: int = 512) -> dict:
output_parser = RuleConfigGeneratorOutputParser() output_parser = RuleConfigGeneratorOutputParser()


error = "" error = ""
"error": "" "error": ""
} }
model_parameters = { model_parameters = {
"max_tokens": 512,
"max_tokens": rule_config_max_tokens,
"temperature": 0.01 "temperature": 0.01
} }



正在加载...
取消
保存