Nevar pievienot vairāk kā 25 tēmas. Tēmai ir jāsākas ar burtu vai ciparu, tā var saturēt domu zīmes ('-') un var būt līdz 35 simboliem gara.

s3_conn.py 4.1KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136
  1. import logging
  2. import boto3
  3. from botocore.exceptions import ClientError
  4. from botocore.client import Config
  5. import time
  6. from io import BytesIO
  7. from rag.utils import singleton
  8. from rag import settings
  9. @singleton
  10. class RAGFlowS3(object):
  11. def __init__(self):
  12. self.conn = None
  13. self.s3_config = settings.S3
  14. self.endpoint = self.s3_config.get('endpoint', None)
  15. self.access_key = self.s3_config.get('access_key', None)
  16. self.secret_key = self.s3_config.get('secret_key', None)
  17. self.region = self.s3_config.get('region', None)
  18. self.__open__()
  19. def __open__(self):
  20. try:
  21. if self.conn:
  22. self.__close__()
  23. except Exception:
  24. pass
  25. try:
  26. config = Config(
  27. s3={
  28. 'addressing_style': 'virtual'
  29. }
  30. )
  31. self.conn = boto3.client(
  32. 's3',
  33. endpoint_url=self.endpoint,
  34. region_name=self.region,
  35. aws_access_key_id=self.access_key,
  36. aws_secret_access_key=self.secret_key,
  37. config=config
  38. )
  39. except Exception:
  40. logging.exception(
  41. "Fail to connect %s" % self.endpoint)
  42. def __close__(self):
  43. del self.conn
  44. self.conn = None
  45. def bucket_exists(self, bucket):
  46. try:
  47. logging.debug(f"head_bucket bucketname {bucket}")
  48. self.conn.head_bucket(Bucket=bucket)
  49. exists = True
  50. except ClientError:
  51. logging.exception(f"head_bucket error {bucket}")
  52. exists = False
  53. return exists
  54. def health(self):
  55. bucket, fnm, binary = "txtxtxtxt1", "txtxtxtxt1", b"_t@@@1"
  56. if not self.bucket_exists(bucket):
  57. self.conn.create_bucket(Bucket=bucket)
  58. logging.debug(f"create bucket {bucket} ********")
  59. r = self.conn.upload_fileobj(BytesIO(binary), bucket, fnm)
  60. return r
  61. def get_properties(self, bucket, key):
  62. return {}
  63. def list(self, bucket, dir, recursive=True):
  64. return []
  65. def put(self, bucket, fnm, binary):
  66. logging.debug(f"bucket name {bucket}; filename :{fnm}:")
  67. for _ in range(1):
  68. try:
  69. if not self.bucket_exists(bucket):
  70. self.conn.create_bucket(Bucket=bucket)
  71. logging.info(f"create bucket {bucket} ********")
  72. r = self.conn.upload_fileobj(BytesIO(binary), bucket, fnm)
  73. return r
  74. except Exception:
  75. logging.exception(f"Fail put {bucket}/{fnm}")
  76. self.__open__()
  77. time.sleep(1)
  78. def rm(self, bucket, fnm):
  79. try:
  80. self.conn.delete_object(Bucket=bucket, Key=fnm)
  81. except Exception:
  82. logging.exception(f"Fail rm {bucket}/{fnm}")
  83. def get(self, bucket, fnm):
  84. for _ in range(1):
  85. try:
  86. r = self.conn.get_object(Bucket=bucket, Key=fnm)
  87. object_data = r['Body'].read()
  88. return object_data
  89. except Exception:
  90. logging.exception(f"fail get {bucket}/{fnm}")
  91. self.__open__()
  92. time.sleep(1)
  93. return
  94. def obj_exist(self, bucket, fnm):
  95. try:
  96. if self.conn.head_object(Bucket=bucket, Key=fnm):
  97. return True
  98. except ClientError as e:
  99. if e.response['Error']['Code'] == '404':
  100. return False
  101. else:
  102. raise
  103. def get_presigned_url(self, bucket, fnm, expires):
  104. for _ in range(10):
  105. try:
  106. r = self.conn.generate_presigned_url('get_object',
  107. Params={'Bucket': bucket,
  108. 'Key': fnm},
  109. ExpiresIn=expires)
  110. return r
  111. except Exception:
  112. logging.exception(f"fail get url {bucket}/{fnm}")
  113. self.__open__()
  114. time.sleep(1)
  115. return