Ви не можете вибрати більше 25 тем. Теми мають розпочинатися з літери або цифри, можуть містити дефіси (-) і не повинні перевищувати 35 символів.

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136
  1. import logging
  2. import boto3
  3. from botocore.exceptions import ClientError
  4. from botocore.client import Config
  5. import time
  6. from io import BytesIO
  7. from rag.utils import singleton
  8. from rag import settings
  @singleton
  class RAGFlowS3(object):
      """Small wrapper around a boto3 S3 client configured from ``settings.S3``.

      The class is wrapped by the project's ``singleton`` decorator
      (presumably so one shared instance is reused -- confirm against
      ``rag.utils.singleton``).

      Most operations are best-effort: failures are logged and reported to
      the caller as ``None`` rather than raised. The exceptions to that are
      ``health``, ``bucket_exists`` and ``obj_exist``; see each method.
      """

      # Error codes treated as "the bucket/object is not there". boto3 reports
      # a missing target of a HEAD request with the HTTP status as the code.
      _NOT_FOUND_CODES = ('404', 'NoSuchKey', 'NoSuchBucket', 'NotFound')

      def __init__(self):
          """Read connection parameters from ``settings.S3`` and open a client."""
          self.conn = None
          self.s3_config = settings.S3
          self.endpoint = self.s3_config.get('endpoint', None)
          self.access_key = self.s3_config.get('access_key', None)
          self.secret_key = self.s3_config.get('secret_key', None)
          self.region = self.s3_config.get('region', None)
          self.__open__()

      def __open__(self):
          """(Re)create the boto3 client, discarding any existing one.

          A failure to build the client is logged, not raised; ``self.conn``
          is then left as ``None``.
          """
          if self.conn:
              self.__close__()

          try:
              config = Config(
                  s3={
                      'addressing_style': 'virtual'
                  }
              )
              self.conn = boto3.client(
                  's3',
                  endpoint_url=self.endpoint,
                  region_name=self.region,
                  aws_access_key_id=self.access_key,
                  aws_secret_access_key=self.secret_key,
                  config=config
              )
          except Exception:
              # Lazy %-args: the message is only formatted if it is emitted.
              logging.exception("Fail to connect %s", self.endpoint)

      def __close__(self):
          """Drop the reference to the current client."""
          self.conn = None

      def _reconnect_after_failure(self, attempt, attempts):
          """Rebuild the client after a failed call; pause only before a retry.

          Args:
              attempt: Zero-based index of the attempt that just failed.
              attempts: Total number of attempts the caller will make.
          """
          self.__open__()
          # Sleeping after the final attempt would only delay the caller.
          if attempt + 1 < attempts:
              time.sleep(1)

      def bucket_exists(self, bucket: str) -> bool:
          """Return whether ``head_bucket`` succeeds for ``bucket``.

          Any ``ClientError`` (including permission errors) yields ``False``.
          A plain "not found" is logged at debug level because callers probe
          for missing buckets on purpose; other client errors keep the full
          traceback. Non-``ClientError`` exceptions propagate.
          """
          try:
              logging.debug(f"head_bucket bucketname {bucket}")
              self.conn.head_bucket(Bucket=bucket)
          except ClientError as e:
              code = e.response.get('Error', {}).get('Code')
              if code in self._NOT_FOUND_CODES:
                  logging.debug(f"head_bucket: bucket {bucket} not found")
              else:
                  logging.exception(f"head_bucket error {bucket}")
              return False
          return True

      def health(self):
          """Probe the store by uploading a tiny object to a fixed bucket.

          The bucket is created first when ``bucket_exists`` reports it
          missing. Nothing is caught here, so any failure raises.

          Returns:
              Whatever ``upload_fileobj`` returns (boto3 documents ``None``).
          """
          bucket, fnm, binary = "txtxtxtxt1", "txtxtxtxt1", b"_t@@@1"
          if not self.bucket_exists(bucket):
              self.conn.create_bucket(Bucket=bucket)
              logging.debug(f"create bucket {bucket} ********")
          return self.conn.upload_fileobj(BytesIO(binary), bucket, fnm)

      def get_properties(self, bucket, key):
          """Placeholder: always returns an empty dict."""
          return {}

      def list(self, bucket, dir, recursive=True):
          """Placeholder: always returns an empty list."""
          return []

      def put(self, bucket, fnm, binary: bytes):
          """Upload ``binary`` as object ``fnm``, creating ``bucket`` if needed.

          Failures are logged and the client is rebuilt; nothing is raised.

          Returns:
              Whatever ``upload_fileobj`` returns on success (boto3 documents
              ``None``), and ``None`` on failure -- so the return value alone
              does not distinguish the two outcomes.
          """
          logging.debug(f"bucket name {bucket}; filename :{fnm}:")
          attempts = 1
          for attempt in range(attempts):
              try:
                  if not self.bucket_exists(bucket):
                      # NOTE(review): no CreateBucketConfiguration is passed;
                      # confirm this works for the configured region/endpoint.
                      self.conn.create_bucket(Bucket=bucket)
                      logging.info(f"create bucket {bucket} ********")
                  return self.conn.upload_fileobj(BytesIO(binary), bucket, fnm)
              except Exception:
                  logging.exception(f"Fail put {bucket}/{fnm}")
                  self._reconnect_after_failure(attempt, attempts)
          return None

      def rm(self, bucket, fnm):
          """Delete object ``fnm`` from ``bucket``; errors are logged, not raised."""
          try:
              self.conn.delete_object(Bucket=bucket, Key=fnm)
          except Exception:
              logging.exception(f"Fail rm {bucket}/{fnm}")

      def get(self, bucket, fnm):
          """Return the full content of object ``fnm``, or ``None`` on failure.

          Failures are logged and the client is rebuilt; nothing is raised.
          """
          attempts = 1
          for attempt in range(attempts):
              try:
                  response = self.conn.get_object(Bucket=bucket, Key=fnm)
                  body = response['Body']
                  try:
                      return body.read()
                  finally:
                      # Release the underlying stream even if read() fails.
                      body.close()
              except Exception:
                  logging.exception(f"fail get {bucket}/{fnm}")
                  self._reconnect_after_failure(attempt, attempts)
          return None

      def obj_exist(self, bucket, fnm) -> bool:
          """Return whether ``head_object`` succeeds for ``bucket``/``fnm``.

          Raises:
              ClientError: For any client error other than "not found".
          """
          try:
              self.conn.head_object(Bucket=bucket, Key=fnm)
          except ClientError as e:
              code = e.response.get('Error', {}).get('Code')
              if code in self._NOT_FOUND_CODES:
                  return False
              raise
          return True

      def get_presigned_url(self, bucket, fnm, expires):
          """Return a presigned ``get_object`` URL, or ``None`` if all tries fail.

          Args:
              bucket: Bucket name.
              fnm: Object key.
              expires: Passed to boto3 as ``ExpiresIn``.

          Up to 10 attempts are made; after each failure the client is rebuilt
          and, when another attempt remains, the call pauses for one second.
          """
          attempts = 10
          for attempt in range(attempts):
              try:
                  return self.conn.generate_presigned_url(
                      'get_object',
                      Params={'Bucket': bucket, 'Key': fnm},
                      ExpiresIn=expires)
              except Exception:
                  logging.exception(f"fail get url {bucket}/{fnm}")
                  self._reconnect_after_failure(attempt, attempts)
          return None