| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254 |
- #
- # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- import os
- from datetime import date
- from enum import IntEnum, Enum
- from api.utils.file_utils import get_project_base_directory
- from api.utils.log_utils import LoggerFactory, getLogger
-
- # Logger
- LoggerFactory.set_directory(
- os.path.join(
- get_project_base_directory(),
- "logs",
- "api"))
- # {CRITICAL: 50, FATAL:50, ERROR:40, WARNING:30, WARN:30, INFO:20, DEBUG:10, NOTSET:0}
- LoggerFactory.LEVEL = 30
-
- stat_logger = getLogger("stat")
- access_logger = getLogger("access")
- database_logger = getLogger("database")
- chat_logger = getLogger("chat")
-
- from rag.utils.es_conn import ELASTICSEARCH
- from rag.nlp import search
- from graphrag import search as kg_search
- from api.utils import get_base_config, decrypt_database_config
-
- API_VERSION = "v1"
- RAG_FLOW_SERVICE_NAME = "ragflow"
- SERVER_MODULE = "rag_flow_server.py"
- TEMP_DIRECTORY = os.path.join(get_project_base_directory(), "temp")
- RAG_FLOW_CONF_PATH = os.path.join(get_project_base_directory(), "conf")
- LIGHTEN = int(os.environ.get('LIGHTEN', "0"))
-
- SUBPROCESS_STD_LOG_NAME = "std.log"
-
- ERROR_REPORT = True
- ERROR_REPORT_WITH_PATH = False
-
- MAX_TIMESTAMP_INTERVAL = 60
- SESSION_VALID_PERIOD = 7 * 24 * 60 * 60
-
- REQUEST_TRY_TIMES = 3
- REQUEST_WAIT_SEC = 2
- REQUEST_MAX_WAIT_SEC = 300
-
- USE_REGISTRY = get_base_config("use_registry")
-
- LLM = get_base_config("user_default_llm", {})
- LLM_FACTORY = LLM.get("factory", "Tongyi-Qianwen")
- LLM_BASE_URL = LLM.get("base_url")
-
- if not LIGHTEN:
- default_llm = {
- "Tongyi-Qianwen": {
- "chat_model": "qwen-plus",
- "embedding_model": "text-embedding-v2",
- "image2text_model": "qwen-vl-max",
- "asr_model": "paraformer-realtime-8k-v1",
- },
- "OpenAI": {
- "chat_model": "gpt-3.5-turbo",
- "embedding_model": "text-embedding-ada-002",
- "image2text_model": "gpt-4-vision-preview",
- "asr_model": "whisper-1",
- },
- "Azure-OpenAI": {
- "chat_model": "gpt-35-turbo",
- "embedding_model": "text-embedding-ada-002",
- "image2text_model": "gpt-4-vision-preview",
- "asr_model": "whisper-1",
- },
- "ZHIPU-AI": {
- "chat_model": "glm-3-turbo",
- "embedding_model": "embedding-2",
- "image2text_model": "glm-4v",
- "asr_model": "",
- },
- "Ollama": {
- "chat_model": "qwen-14B-chat",
- "embedding_model": "flag-embedding",
- "image2text_model": "",
- "asr_model": "",
- },
- "Moonshot": {
- "chat_model": "moonshot-v1-8k",
- "embedding_model": "",
- "image2text_model": "",
- "asr_model": "",
- },
- "DeepSeek": {
- "chat_model": "deepseek-chat",
- "embedding_model": "",
- "image2text_model": "",
- "asr_model": "",
- },
- "VolcEngine": {
- "chat_model": "",
- "embedding_model": "",
- "image2text_model": "",
- "asr_model": "",
- },
- "BAAI": {
- "chat_model": "",
- "embedding_model": "BAAI/bge-large-zh-v1.5",
- "image2text_model": "",
- "asr_model": "",
- "rerank_model": "BAAI/bge-reranker-v2-m3",
- }
- }
-
- CHAT_MDL = default_llm[LLM_FACTORY]["chat_model"]
- EMBEDDING_MDL = default_llm["BAAI"]["embedding_model"]
- RERANK_MDL = default_llm["BAAI"]["rerank_model"]
- ASR_MDL = default_llm[LLM_FACTORY]["asr_model"]
- IMAGE2TEXT_MDL = default_llm[LLM_FACTORY]["image2text_model"]
- else:
- CHAT_MDL = EMBEDDING_MDL = RERANK_MDL = ASR_MDL = IMAGE2TEXT_MDL = ""
-
- API_KEY = LLM.get("api_key", "")
- PARSERS = LLM.get(
- "parsers",
- "naive:General,qa:Q&A,resume:Resume,manual:Manual,table:Table,paper:Paper,book:Book,laws:Laws,presentation:Presentation,picture:Picture,one:One,audio:Audio,knowledge_graph:Knowledge Graph,email:Email")
-
- # distribution
- DEPENDENT_DISTRIBUTION = get_base_config("dependent_distribution", False)
- RAG_FLOW_UPDATE_CHECK = False
-
- HOST = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("host", "127.0.0.1")
- HTTP_PORT = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("http_port")
-
- SECRET_KEY = get_base_config(
- RAG_FLOW_SERVICE_NAME,
- {}).get("secret_key", str(date.today()))
-
- TOKEN_EXPIRE_IN = get_base_config(
- RAG_FLOW_SERVICE_NAME, {}).get(
- "token_expires_in", 3600)
-
- NGINX_HOST = get_base_config(
- RAG_FLOW_SERVICE_NAME, {}).get(
- "nginx", {}).get("host") or HOST
- NGINX_HTTP_PORT = get_base_config(
- RAG_FLOW_SERVICE_NAME, {}).get(
- "nginx", {}).get("http_port") or HTTP_PORT
-
- RANDOM_INSTANCE_ID = get_base_config(
- RAG_FLOW_SERVICE_NAME, {}).get(
- "random_instance_id", False)
-
- PROXY = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("proxy")
- PROXY_PROTOCOL = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("protocol")
-
- DATABASE_TYPE = os.getenv("DB_TYPE", 'mysql')
- DATABASE = decrypt_database_config(name=DATABASE_TYPE)
-
- # Switch
- # upload
- UPLOAD_DATA_FROM_CLIENT = True
-
- # authentication
- AUTHENTICATION_CONF = get_base_config("authentication", {})
-
- # client
- CLIENT_AUTHENTICATION = AUTHENTICATION_CONF.get(
- "client", {}).get(
- "switch", False)
- HTTP_APP_KEY = AUTHENTICATION_CONF.get("client", {}).get("http_app_key")
- GITHUB_OAUTH = get_base_config("oauth", {}).get("github")
- FEISHU_OAUTH = get_base_config("oauth", {}).get("feishu")
- WECHAT_OAUTH = get_base_config("oauth", {}).get("wechat")
-
- # site
- SITE_AUTHENTICATION = AUTHENTICATION_CONF.get("site", {}).get("switch", False)
-
- # permission
- PERMISSION_CONF = get_base_config("permission", {})
- PERMISSION_SWITCH = PERMISSION_CONF.get("switch")
- COMPONENT_PERMISSION = PERMISSION_CONF.get("component")
- DATASET_PERMISSION = PERMISSION_CONF.get("dataset")
-
- HOOK_MODULE = get_base_config("hook_module")
- HOOK_SERVER_NAME = get_base_config("hook_server_name")
-
- ENABLE_MODEL_STORE = get_base_config('enable_model_store', False)
- # authentication
- USE_AUTHENTICATION = False
- USE_DATA_AUTHENTICATION = False
- AUTOMATIC_AUTHORIZATION_OUTPUT_DATA = True
- USE_DEFAULT_TIMEOUT = False
- AUTHENTICATION_DEFAULT_TIMEOUT = 7 * 24 * 60 * 60 # s
- PRIVILEGE_COMMAND_WHITELIST = []
- CHECK_NODES_IDENTITY = False
-
- retrievaler = search.Dealer(ELASTICSEARCH)
- kg_retrievaler = kg_search.KGSearch(ELASTICSEARCH)
-
-
- class CustomEnum(Enum):
- @classmethod
- def valid(cls, value):
- try:
- cls(value)
- return True
- except BaseException:
- return False
-
- @classmethod
- def values(cls):
- return [member.value for member in cls.__members__.values()]
-
- @classmethod
- def names(cls):
- return [member.name for member in cls.__members__.values()]
-
-
- class PythonDependenceName(CustomEnum):
- Rag_Source_Code = "python"
- Python_Env = "miniconda"
-
-
- class ModelStorage(CustomEnum):
- REDIS = "redis"
- MYSQL = "mysql"
-
-
- class RetCode(IntEnum, CustomEnum):
- SUCCESS = 0
- NOT_EFFECTIVE = 10
- EXCEPTION_ERROR = 100
- ARGUMENT_ERROR = 101
- DATA_ERROR = 102
- OPERATING_ERROR = 103
- CONNECTION_ERROR = 105
- RUNNING = 106
- PERMISSION_ERROR = 108
- AUTHENTICATION_ERROR = 109
- UNAUTHORIZED = 401
- SERVER_ERROR = 500
- FORBIDDEN = 403
- NOT_FOUND = 404
|