You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

settings.py 6.7KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. from rag.utils import ELASTICSEARCH
  17. from rag.nlp import search
  18. import os
  19. from enum import IntEnum, Enum
  20. from api.utils import get_base_config, decrypt_database_config
  21. from api.utils.file_utils import get_project_base_directory
  22. from api.utils.log_utils import LoggerFactory, getLogger
  23. # Logger
  24. LoggerFactory.set_directory(
  25. os.path.join(
  26. get_project_base_directory(),
  27. "logs",
  28. "api"))
  29. # {CRITICAL: 50, FATAL:50, ERROR:40, WARNING:30, WARN:30, INFO:20, DEBUG:10, NOTSET:0}
  30. LoggerFactory.LEVEL = 10
  31. stat_logger = getLogger("stat")
  32. access_logger = getLogger("access")
  33. database_logger = getLogger("database")
  34. chat_logger = getLogger("chat")
  35. API_VERSION = "v1"
  36. RAG_FLOW_SERVICE_NAME = "ragflow"
  37. SERVER_MODULE = "rag_flow_server.py"
  38. TEMP_DIRECTORY = os.path.join(get_project_base_directory(), "temp")
  39. RAG_FLOW_CONF_PATH = os.path.join(get_project_base_directory(), "conf")
  40. SUBPROCESS_STD_LOG_NAME = "std.log"
  41. ERROR_REPORT = True
  42. ERROR_REPORT_WITH_PATH = False
  43. MAX_TIMESTAMP_INTERVAL = 60
  44. SESSION_VALID_PERIOD = 7 * 24 * 60 * 60
  45. REQUEST_TRY_TIMES = 3
  46. REQUEST_WAIT_SEC = 2
  47. REQUEST_MAX_WAIT_SEC = 300
  48. USE_REGISTRY = get_base_config("use_registry")
  49. default_llm = {
  50. "Tongyi-Qianwen": {
  51. "chat_model": "qwen-plus",
  52. "embedding_model": "text-embedding-v2",
  53. "image2text_model": "qwen-vl-max",
  54. "asr_model": "paraformer-realtime-8k-v1",
  55. },
  56. "OpenAI": {
  57. "chat_model": "gpt-3.5-turbo",
  58. "embedding_model": "text-embedding-ada-002",
  59. "image2text_model": "gpt-4-vision-preview",
  60. "asr_model": "whisper-1",
  61. },
  62. "ZHIPU-AI": {
  63. "chat_model": "glm-3-turbo",
  64. "embedding_model": "embedding-2",
  65. "image2text_model": "glm-4v",
  66. "asr_model": "",
  67. },
  68. "Local": {
  69. "chat_model": "qwen-14B-chat",
  70. "embedding_model": "flag-embedding",
  71. "image2text_model": "",
  72. "asr_model": "",
  73. },
  74. "Moonshot": {
  75. "chat_model": "moonshot-v1-8k",
  76. "embedding_model": "",
  77. "image2text_model": "",
  78. "asr_model": "",
  79. }
  80. }
  81. LLM = get_base_config("user_default_llm", {})
  82. LLM_FACTORY = LLM.get("factory", "Tongyi-Qianwen")
  83. if LLM_FACTORY not in default_llm:
  84. print(
  85. "\33[91m【ERROR】\33[0m:",
  86. f"LLM factory {LLM_FACTORY} has not supported yet, switch to 'Tongyi-Qianwen/QWen' automatically, and please check the API_KEY in service_conf.yaml.")
  87. LLM_FACTORY = "Tongyi-Qianwen"
  88. CHAT_MDL = default_llm[LLM_FACTORY]["chat_model"]
  89. EMBEDDING_MDL = default_llm[LLM_FACTORY]["embedding_model"]
  90. ASR_MDL = default_llm[LLM_FACTORY]["asr_model"]
  91. IMAGE2TEXT_MDL = default_llm[LLM_FACTORY]["image2text_model"]
  92. API_KEY = LLM.get("api_key", "")
  93. PARSERS = LLM.get(
  94. "parsers",
  95. "naive:General,qa:Q&A,resume:Resume,manual:Manual,table:Table,paper:Paper,book:Book,laws:Laws,presentation:Presentation,picture:Picture,one:One")
  96. # distribution
  97. DEPENDENT_DISTRIBUTION = get_base_config("dependent_distribution", False)
  98. RAG_FLOW_UPDATE_CHECK = False
  99. HOST = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("host", "127.0.0.1")
  100. HTTP_PORT = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("http_port")
  101. SECRET_KEY = get_base_config(
  102. RAG_FLOW_SERVICE_NAME,
  103. {}).get(
  104. "secret_key",
  105. "infiniflow")
  106. TOKEN_EXPIRE_IN = get_base_config(
  107. RAG_FLOW_SERVICE_NAME, {}).get(
  108. "token_expires_in", 3600)
  109. NGINX_HOST = get_base_config(
  110. RAG_FLOW_SERVICE_NAME, {}).get(
  111. "nginx", {}).get("host") or HOST
  112. NGINX_HTTP_PORT = get_base_config(
  113. RAG_FLOW_SERVICE_NAME, {}).get(
  114. "nginx", {}).get("http_port") or HTTP_PORT
  115. RANDOM_INSTANCE_ID = get_base_config(
  116. RAG_FLOW_SERVICE_NAME, {}).get(
  117. "random_instance_id", False)
  118. PROXY = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("proxy")
  119. PROXY_PROTOCOL = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("protocol")
  120. DATABASE = decrypt_database_config(name="mysql")
  121. # Switch
  122. # upload
  123. UPLOAD_DATA_FROM_CLIENT = True
  124. # authentication
  125. AUTHENTICATION_CONF = get_base_config("authentication", {})
  126. # client
  127. CLIENT_AUTHENTICATION = AUTHENTICATION_CONF.get(
  128. "client", {}).get(
  129. "switch", False)
  130. HTTP_APP_KEY = AUTHENTICATION_CONF.get("client", {}).get("http_app_key")
  131. GITHUB_OAUTH = get_base_config("oauth", {}).get("github")
  132. WECHAT_OAUTH = get_base_config("oauth", {}).get("wechat")
  133. # site
  134. SITE_AUTHENTICATION = AUTHENTICATION_CONF.get("site", {}).get("switch", False)
  135. # permission
  136. PERMISSION_CONF = get_base_config("permission", {})
  137. PERMISSION_SWITCH = PERMISSION_CONF.get("switch")
  138. COMPONENT_PERMISSION = PERMISSION_CONF.get("component")
  139. DATASET_PERMISSION = PERMISSION_CONF.get("dataset")
  140. HOOK_MODULE = get_base_config("hook_module")
  141. HOOK_SERVER_NAME = get_base_config("hook_server_name")
  142. ENABLE_MODEL_STORE = get_base_config('enable_model_store', False)
  143. # authentication
  144. USE_AUTHENTICATION = False
  145. USE_DATA_AUTHENTICATION = False
  146. AUTOMATIC_AUTHORIZATION_OUTPUT_DATA = True
  147. USE_DEFAULT_TIMEOUT = False
  148. AUTHENTICATION_DEFAULT_TIMEOUT = 7 * 24 * 60 * 60 # s
  149. PRIVILEGE_COMMAND_WHITELIST = []
  150. CHECK_NODES_IDENTITY = False
  151. retrievaler = search.Dealer(ELASTICSEARCH)
  152. class CustomEnum(Enum):
  153. @classmethod
  154. def valid(cls, value):
  155. try:
  156. cls(value)
  157. return True
  158. except BaseException:
  159. return False
  160. @classmethod
  161. def values(cls):
  162. return [member.value for member in cls.__members__.values()]
  163. @classmethod
  164. def names(cls):
  165. return [member.name for member in cls.__members__.values()]
  166. class PythonDependenceName(CustomEnum):
  167. Rag_Source_Code = "python"
  168. Python_Env = "miniconda"
  169. class ModelStorage(CustomEnum):
  170. REDIS = "redis"
  171. MYSQL = "mysql"
  172. class RetCode(IntEnum, CustomEnum):
  173. SUCCESS = 0
  174. NOT_EFFECTIVE = 10
  175. EXCEPTION_ERROR = 100
  176. ARGUMENT_ERROR = 101
  177. DATA_ERROR = 102
  178. OPERATING_ERROR = 103
  179. CONNECTION_ERROR = 105
  180. RUNNING = 106
  181. PERMISSION_ERROR = 108
  182. AUTHENTICATION_ERROR = 109
  183. SERVER_ERROR = 500