azure_blob_storage.py 3.3 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182
  1. from collections.abc import Generator
  2. from datetime import UTC, datetime, timedelta
  3. from azure.identity import DefaultAzureCredential
  4. from azure.storage.blob import AccountSasPermissions, BlobServiceClient, ResourceTypes, generate_account_sas
  5. from configs import dify_config
  6. from extensions.ext_redis import redis_client
  7. from extensions.storage.base_storage import BaseStorage
  class AzureBlobStorage(BaseStorage):
      """Implementation for Azure Blob storage.

      Files are stored as blobs inside the container named by
      ``dify_config.AZURE_BLOB_CONTAINER_NAME``. The authentication mode is
      selected by ``dify_config.AZURE_BLOB_ACCOUNT_KEY``: the sentinel value
      ``"managedidentity"`` makes every client use ``DefaultAzureCredential``;
      any other value is used as an account key to sign an account SAS token,
      which is cached in Redis and reused until the cache entry expires.
      """

      # Sentinel account-key value that switches to DefaultAzureCredential.
      _MANAGED_IDENTITY = "managedidentity"
      # Validity window of a freshly generated SAS token.
      _SAS_TOKEN_LIFETIME = timedelta(hours=1)
      # Redis TTL (seconds) of the cached token. Kept shorter than the token
      # lifetime so a cached token is not handed out after it has expired.
      _SAS_CACHE_TTL_SECONDS = 3000

      def __init__(self):
          """Read the Azure settings from ``dify_config`` and pick a credential."""
          super().__init__()
          self.bucket_name = dify_config.AZURE_BLOB_CONTAINER_NAME
          self.account_url = dify_config.AZURE_BLOB_ACCOUNT_URL
          self.account_name = dify_config.AZURE_BLOB_ACCOUNT_NAME
          self.account_key = dify_config.AZURE_BLOB_ACCOUNT_KEY
          if self.account_key == self._MANAGED_IDENTITY:
              self.credential = DefaultAzureCredential()
          else:
              # SAS mode: the credential is a token produced in _sync_client().
              self.credential = None

      def save(self, filename, data):
          """Upload ``data`` as the blob ``filename`` in the configured container."""
          self._container_client().upload_blob(filename, data)

      def load_once(self, filename: str) -> bytes:
          """Download the blob ``filename`` and return its full content."""
          # Separate names for the container client and the blob client; the
          # two are different client types.
          container_client = self._container_client()
          blob_client = container_client.get_blob_client(blob=filename)
          data: bytes = blob_client.download_blob().readall()
          return data

      def load_stream(self, filename: str) -> Generator[bytes, None, None]:
          """Yield the content of the blob ``filename`` chunk by chunk."""
          downloader = self._blob_client(filename).download_blob()
          yield from downloader.chunks()

      def download(self, filename, target_filepath):
          """Write the content of the blob ``filename`` to ``target_filepath``."""
          # Request the blob before opening the target: if the request raises,
          # open(..., "wb") is never reached, so an existing file at
          # target_filepath is not truncated and no empty file is created.
          downloader = self._blob_client(filename).download_blob()
          with open(target_filepath, "wb") as target_file:
              downloader.readinto(target_file)

      def exists(self, filename):
          """Return the result of the blob client's ``exists()`` for ``filename``."""
          return self._blob_client(filename).exists()

      def delete(self, filename):
          """Delete the blob ``filename`` from the configured container."""
          self._container_client().delete_blob(filename)

      def _container_client(self):
          """Return a client for the configured container."""
          return self._sync_client().get_container_client(container=self.bucket_name)

      def _blob_client(self, filename):
          """Return a client for the blob ``filename`` in the configured container."""
          return self._sync_client().get_blob_client(container=self.bucket_name, blob=filename)

      def _sync_client(self):
          """Build a ``BlobServiceClient`` for the configured account.

          In managed-identity mode the client uses the credential created in
          ``__init__``. Otherwise it uses an account SAS token, taken from Redis
          when a cached one exists and generated (then cached) when not.
          """
          if self.account_key == self._MANAGED_IDENTITY:
              return BlobServiceClient(account_url=self.account_url, credential=self.credential)

          # Local import keeps this block self-contained.
          import hashlib

          # Never put the raw account key into the Redis key name: key names
          # are visible to anything that can list or monitor keys. A digest
          # still gives a distinct cache entry per (account, key) pair.
          key_digest = hashlib.sha256((self.account_key or "").encode("utf-8")).hexdigest()
          cache_key = f"azure_blob_sas_token_{self.account_name}_{key_digest}"

          cached_token = redis_client.get(cache_key)
          if cached_token is not None:
              # Accept both bytes and str so this works whether or not the
              # Redis client is configured to decode responses.
              if isinstance(cached_token, bytes):
                  sas_token = cached_token.decode("utf-8")
              else:
                  sas_token = str(cached_token)
          else:
              sas_token = generate_account_sas(
                  account_name=self.account_name or "",
                  account_key=self.account_key or "",
                  resource_types=ResourceTypes(service=True, container=True, object=True),
                  permission=AccountSasPermissions(
                      read=True, write=True, delete=True, list=True, add=True, create=True
                  ),
                  # Naive datetime carrying the current UTC time plus the lifetime.
                  expiry=datetime.now(UTC).replace(tzinfo=None) + self._SAS_TOKEN_LIFETIME,
              )
              redis_client.set(cache_key, sas_token, ex=self._SAS_CACHE_TTL_SECONDS)

          return BlobServiceClient(account_url=self.account_url or "", credential=sas_token)