| 
                        123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124 | 
                        - import mimetypes
 - import os
 - import platform
 - import re
 - import urllib.parse
 - import warnings
 - from collections.abc import Mapping
 - from typing import Any
 - from uuid import uuid4
 - 
 - import httpx
 - 
 - try:
 -     import magic
 - except ImportError:
 -     if platform.system() == "Windows":
 -         warnings.warn(
 -             "To use python-magic guess MIMETYPE, you need to run `pip install python-magic-bin`", stacklevel=2
 -         )
 -     elif platform.system() == "Darwin":
 -         warnings.warn("To use python-magic guess MIMETYPE, you need to run `brew install libmagic`", stacklevel=2)
 -     elif platform.system() == "Linux":
 -         warnings.warn(
 -             "To use python-magic guess MIMETYPE, you need to run `sudo apt-get install libmagic1`", stacklevel=2
 -         )
 -     else:
 -         warnings.warn("To use python-magic guess MIMETYPE, you need to install `libmagic`", stacklevel=2)
 -     magic = None  # type: ignore
 - 
 - from pydantic import BaseModel
 - 
 - from configs import dify_config
 - 
 - 
 - class FileInfo(BaseModel):
 -     filename: str
 -     extension: str
 -     mimetype: str
 -     size: int
 - 
 - 
 - def guess_file_info_from_response(response: httpx.Response):
 -     url = str(response.url)
 -     # Try to extract filename from URL
 -     parsed_url = urllib.parse.urlparse(url)
 -     url_path = parsed_url.path
 -     filename = os.path.basename(url_path)
 - 
 -     # If filename couldn't be extracted, use Content-Disposition header
 -     if not filename:
 -         content_disposition = response.headers.get("Content-Disposition")
 -         if content_disposition:
 -             filename_match = re.search(r'filename="?(.+)"?', content_disposition)
 -             if filename_match:
 -                 filename = filename_match.group(1)
 - 
 -     # If still no filename, generate a unique one
 -     if not filename:
 -         unique_name = str(uuid4())
 -         filename = f"{unique_name}"
 - 
 -     # Guess MIME type from filename first, then URL
 -     mimetype, _ = mimetypes.guess_type(filename)
 -     if mimetype is None:
 -         mimetype, _ = mimetypes.guess_type(url)
 -     if mimetype is None:
 -         # If guessing fails, use Content-Type from response headers
 -         mimetype = response.headers.get("Content-Type", "application/octet-stream")
 - 
 -     # Use python-magic to guess MIME type if still unknown or generic
 -     if mimetype == "application/octet-stream" and magic is not None:
 -         try:
 -             mimetype = magic.from_buffer(response.content[:1024], mime=True)
 -         except magic.MagicException:
 -             pass
 - 
 -     extension = os.path.splitext(filename)[1]
 - 
 -     # Ensure filename has an extension
 -     if not extension:
 -         extension = mimetypes.guess_extension(mimetype) or ".bin"
 -         filename = f"{filename}{extension}"
 - 
 -     return FileInfo(
 -         filename=filename,
 -         extension=extension,
 -         mimetype=mimetype,
 -         size=int(response.headers.get("Content-Length", -1)),
 -     )
 - 
 - 
 - def get_parameters_from_feature_dict(*, features_dict: Mapping[str, Any], user_input_form: list[dict[str, Any]]):
 -     return {
 -         "opening_statement": features_dict.get("opening_statement"),
 -         "suggested_questions": features_dict.get("suggested_questions", []),
 -         "suggested_questions_after_answer": features_dict.get("suggested_questions_after_answer", {"enabled": False}),
 -         "speech_to_text": features_dict.get("speech_to_text", {"enabled": False}),
 -         "text_to_speech": features_dict.get("text_to_speech", {"enabled": False}),
 -         "retriever_resource": features_dict.get("retriever_resource", {"enabled": False}),
 -         "annotation_reply": features_dict.get("annotation_reply", {"enabled": False}),
 -         "more_like_this": features_dict.get("more_like_this", {"enabled": False}),
 -         "user_input_form": user_input_form,
 -         "sensitive_word_avoidance": features_dict.get(
 -             "sensitive_word_avoidance", {"enabled": False, "type": "", "configs": []}
 -         ),
 -         "file_upload": features_dict.get(
 -             "file_upload",
 -             {
 -                 "image": {
 -                     "enabled": False,
 -                     "number_limits": 3,
 -                     "detail": "high",
 -                     "transfer_methods": ["remote_url", "local_file"],
 -                 }
 -             },
 -         ),
 -         "system_parameters": {
 -             "image_file_size_limit": dify_config.UPLOAD_IMAGE_FILE_SIZE_LIMIT,
 -             "video_file_size_limit": dify_config.UPLOAD_VIDEO_FILE_SIZE_LIMIT,
 -             "audio_file_size_limit": dify_config.UPLOAD_AUDIO_FILE_SIZE_LIMIT,
 -             "file_size_limit": dify_config.UPLOAD_FILE_SIZE_LIMIT,
 -             "workflow_file_upload_limit": dify_config.WORKFLOW_FILE_UPLOAD_LIMIT,
 -         },
 -     }
 
 
  |