Nevar pievienot vairāk kā 25 tēmas. Tēmai ir jāsākas ar burtu vai ciparu, tā var saturēt domu zīmes ('-') un var būt līdz 35 simboliem gara.

settings.py 8.0KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261
  1. #
  2. # Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
  3. #
  4. # Licensed under the Apache License, Version 2.0 (the "License");
  5. # you may not use this file except in compliance with the License.
  6. # You may obtain a copy of the License at
  7. #
  8. # http://www.apache.org/licenses/LICENSE-2.0
  9. #
  10. # Unless required by applicable law or agreed to in writing, software
  11. # distributed under the License is distributed on an "AS IS" BASIS,
  12. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. # See the License for the specific language governing permissions and
  14. # limitations under the License.
  15. #
  16. import os
  17. from datetime import date
  18. from enum import IntEnum, Enum
  19. from api.utils.file_utils import get_project_base_directory
  20. from api.utils.log_utils import LoggerFactory, getLogger
  21. import rag.utils.es_conn
  22. import rag.utils.infinity_conn
  23. # Logger
  24. LoggerFactory.set_directory(
  25. os.path.join(
  26. get_project_base_directory(),
  27. "logs",
  28. "api"))
  29. # {CRITICAL: 50, FATAL:50, ERROR:40, WARNING:30, WARN:30, INFO:20, DEBUG:10, NOTSET:0}
  30. LoggerFactory.LEVEL = 30
  31. stat_logger = getLogger("stat")
  32. access_logger = getLogger("access")
  33. database_logger = getLogger("database")
  34. chat_logger = getLogger("chat")
  35. import rag.utils
  36. from rag.nlp import search
  37. from graphrag import search as kg_search
  38. from api.utils import get_base_config, decrypt_database_config
  39. API_VERSION = "v1"
  40. RAG_FLOW_SERVICE_NAME = "ragflow"
  41. SERVER_MODULE = "rag_flow_server.py"
  42. TEMP_DIRECTORY = os.path.join(get_project_base_directory(), "temp")
  43. RAG_FLOW_CONF_PATH = os.path.join(get_project_base_directory(), "conf")
  44. LIGHTEN = int(os.environ.get('LIGHTEN', "0"))
  45. SUBPROCESS_STD_LOG_NAME = "std.log"
  46. ERROR_REPORT = True
  47. ERROR_REPORT_WITH_PATH = False
  48. MAX_TIMESTAMP_INTERVAL = 60
  49. SESSION_VALID_PERIOD = 7 * 24 * 60 * 60
  50. REQUEST_TRY_TIMES = 3
  51. REQUEST_WAIT_SEC = 2
  52. REQUEST_MAX_WAIT_SEC = 300
  53. USE_REGISTRY = get_base_config("use_registry")
  54. LLM = get_base_config("user_default_llm", {})
  55. LLM_FACTORY = LLM.get("factory", "Tongyi-Qianwen")
  56. LLM_BASE_URL = LLM.get("base_url")
  57. CHAT_MDL = EMBEDDING_MDL = RERANK_MDL = ASR_MDL = IMAGE2TEXT_MDL = ""
  58. if not LIGHTEN:
  59. default_llm = {
  60. "Tongyi-Qianwen": {
  61. "chat_model": "qwen-plus",
  62. "embedding_model": "text-embedding-v2",
  63. "image2text_model": "qwen-vl-max",
  64. "asr_model": "paraformer-realtime-8k-v1",
  65. },
  66. "OpenAI": {
  67. "chat_model": "gpt-3.5-turbo",
  68. "embedding_model": "text-embedding-ada-002",
  69. "image2text_model": "gpt-4-vision-preview",
  70. "asr_model": "whisper-1",
  71. },
  72. "Azure-OpenAI": {
  73. "chat_model": "gpt-35-turbo",
  74. "embedding_model": "text-embedding-ada-002",
  75. "image2text_model": "gpt-4-vision-preview",
  76. "asr_model": "whisper-1",
  77. },
  78. "ZHIPU-AI": {
  79. "chat_model": "glm-3-turbo",
  80. "embedding_model": "embedding-2",
  81. "image2text_model": "glm-4v",
  82. "asr_model": "",
  83. },
  84. "Ollama": {
  85. "chat_model": "qwen-14B-chat",
  86. "embedding_model": "flag-embedding",
  87. "image2text_model": "",
  88. "asr_model": "",
  89. },
  90. "Moonshot": {
  91. "chat_model": "moonshot-v1-8k",
  92. "embedding_model": "",
  93. "image2text_model": "",
  94. "asr_model": "",
  95. },
  96. "DeepSeek": {
  97. "chat_model": "deepseek-chat",
  98. "embedding_model": "",
  99. "image2text_model": "",
  100. "asr_model": "",
  101. },
  102. "VolcEngine": {
  103. "chat_model": "",
  104. "embedding_model": "",
  105. "image2text_model": "",
  106. "asr_model": "",
  107. },
  108. "BAAI": {
  109. "chat_model": "",
  110. "embedding_model": "BAAI/bge-large-zh-v1.5",
  111. "image2text_model": "",
  112. "asr_model": "",
  113. "rerank_model": "BAAI/bge-reranker-v2-m3",
  114. }
  115. }
  116. if LLM_FACTORY:
  117. CHAT_MDL = default_llm[LLM_FACTORY]["chat_model"] + f"@{LLM_FACTORY}"
  118. ASR_MDL = default_llm[LLM_FACTORY]["asr_model"] + f"@{LLM_FACTORY}"
  119. IMAGE2TEXT_MDL = default_llm[LLM_FACTORY]["image2text_model"] + f"@{LLM_FACTORY}"
  120. EMBEDDING_MDL = default_llm["BAAI"]["embedding_model"] + "@BAAI"
  121. RERANK_MDL = default_llm["BAAI"]["rerank_model"] + "@BAAI"
  122. API_KEY = LLM.get("api_key", "")
  123. PARSERS = LLM.get(
  124. "parsers",
  125. "naive:General,qa:Q&A,resume:Resume,manual:Manual,table:Table,paper:Paper,book:Book,laws:Laws,presentation:Presentation,picture:Picture,one:One,audio:Audio,knowledge_graph:Knowledge Graph,email:Email")
  126. # distribution
  127. DEPENDENT_DISTRIBUTION = get_base_config("dependent_distribution", False)
  128. RAG_FLOW_UPDATE_CHECK = False
  129. HOST = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("host", "127.0.0.1")
  130. HTTP_PORT = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("http_port")
  131. SECRET_KEY = get_base_config(
  132. RAG_FLOW_SERVICE_NAME,
  133. {}).get("secret_key", str(date.today()))
  134. TOKEN_EXPIRE_IN = get_base_config(
  135. RAG_FLOW_SERVICE_NAME, {}).get(
  136. "token_expires_in", 3600)
  137. NGINX_HOST = get_base_config(
  138. RAG_FLOW_SERVICE_NAME, {}).get(
  139. "nginx", {}).get("host") or HOST
  140. NGINX_HTTP_PORT = get_base_config(
  141. RAG_FLOW_SERVICE_NAME, {}).get(
  142. "nginx", {}).get("http_port") or HTTP_PORT
  143. RANDOM_INSTANCE_ID = get_base_config(
  144. RAG_FLOW_SERVICE_NAME, {}).get(
  145. "random_instance_id", False)
  146. PROXY = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("proxy")
  147. PROXY_PROTOCOL = get_base_config(RAG_FLOW_SERVICE_NAME, {}).get("protocol")
  148. DATABASE_TYPE = os.getenv("DB_TYPE", 'mysql')
  149. DATABASE = decrypt_database_config(name=DATABASE_TYPE)
  150. # Switch
  151. # upload
  152. UPLOAD_DATA_FROM_CLIENT = True
  153. # authentication
  154. AUTHENTICATION_CONF = get_base_config("authentication", {})
  155. # client
  156. CLIENT_AUTHENTICATION = AUTHENTICATION_CONF.get(
  157. "client", {}).get(
  158. "switch", False)
  159. HTTP_APP_KEY = AUTHENTICATION_CONF.get("client", {}).get("http_app_key")
  160. GITHUB_OAUTH = get_base_config("oauth", {}).get("github")
  161. FEISHU_OAUTH = get_base_config("oauth", {}).get("feishu")
  162. WECHAT_OAUTH = get_base_config("oauth", {}).get("wechat")
  163. # site
  164. SITE_AUTHENTICATION = AUTHENTICATION_CONF.get("site", {}).get("switch", False)
  165. # permission
  166. PERMISSION_CONF = get_base_config("permission", {})
  167. PERMISSION_SWITCH = PERMISSION_CONF.get("switch")
  168. COMPONENT_PERMISSION = PERMISSION_CONF.get("component")
  169. DATASET_PERMISSION = PERMISSION_CONF.get("dataset")
  170. HOOK_MODULE = get_base_config("hook_module")
  171. HOOK_SERVER_NAME = get_base_config("hook_server_name")
  172. ENABLE_MODEL_STORE = get_base_config('enable_model_store', False)
  173. # authentication
  174. USE_AUTHENTICATION = False
  175. USE_DATA_AUTHENTICATION = False
  176. AUTOMATIC_AUTHORIZATION_OUTPUT_DATA = True
  177. USE_DEFAULT_TIMEOUT = False
  178. AUTHENTICATION_DEFAULT_TIMEOUT = 7 * 24 * 60 * 60 # s
  179. PRIVILEGE_COMMAND_WHITELIST = []
  180. CHECK_NODES_IDENTITY = False
  181. if 'username' in get_base_config("es", {}):
  182. docStoreConn = rag.utils.es_conn.ESConnection()
  183. else:
  184. docStoreConn = rag.utils.infinity_conn.InfinityConnection()
  185. retrievaler = search.Dealer(docStoreConn)
  186. kg_retrievaler = kg_search.KGSearch(docStoreConn)
  187. class CustomEnum(Enum):
  188. @classmethod
  189. def valid(cls, value):
  190. try:
  191. cls(value)
  192. return True
  193. except BaseException:
  194. return False
  195. @classmethod
  196. def values(cls):
  197. return [member.value for member in cls.__members__.values()]
  198. @classmethod
  199. def names(cls):
  200. return [member.name for member in cls.__members__.values()]
  201. class PythonDependenceName(CustomEnum):
  202. Rag_Source_Code = "python"
  203. Python_Env = "miniconda"
  204. class ModelStorage(CustomEnum):
  205. REDIS = "redis"
  206. MYSQL = "mysql"
  207. class RetCode(IntEnum, CustomEnum):
  208. SUCCESS = 0
  209. NOT_EFFECTIVE = 10
  210. EXCEPTION_ERROR = 100
  211. ARGUMENT_ERROR = 101
  212. DATA_ERROR = 102
  213. OPERATING_ERROR = 103
  214. CONNECTION_ERROR = 105
  215. RUNNING = 106
  216. PERMISSION_ERROR = 108
  217. AUTHENTICATION_ERROR = 109
  218. UNAUTHORIZED = 401
  219. SERVER_ERROR = 500
  220. FORBIDDEN = 403
  221. NOT_FOUND = 404