|
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144 |
- import urllib.parse
-
- import httpx
- from flask_restx import marshal_with, reqparse
-
- import services
- from controllers.common import helpers
- from controllers.common.errors import (
- FileTooLargeError,
- RemoteFileUploadError,
- UnsupportedFileTypeError,
- )
- from controllers.web import web_ns
- from controllers.web.wraps import WebApiResource
- from core.file import helpers as file_helpers
- from core.helper import ssrf_proxy
- from extensions.ext_database import db
- from fields.file_fields import build_file_with_signed_url_model, build_remote_file_info_model
- from services.file_service import FileService
-
-
- @web_ns.route("/remote-files/<path:url>")
- class RemoteFileInfoApi(WebApiResource):
- @web_ns.doc("get_remote_file_info")
- @web_ns.doc(description="Get information about a remote file")
- @web_ns.doc(
- responses={
- 200: "Remote file information retrieved successfully",
- 400: "Bad request - invalid URL",
- 404: "Remote file not found",
- 500: "Failed to fetch remote file",
- }
- )
- @marshal_with(build_remote_file_info_model(web_ns))
- def get(self, app_model, end_user, url):
- """Get information about a remote file.
-
- Retrieves basic information about a file located at a remote URL,
- including content type and content length.
-
- Args:
- app_model: The associated application model
- end_user: The end user making the request
- url: URL-encoded path to the remote file
-
- Returns:
- dict: Remote file information including type and length
-
- Raises:
- HTTPException: If the remote file cannot be accessed
- """
- decoded_url = urllib.parse.unquote(url)
- resp = ssrf_proxy.head(decoded_url)
- if resp.status_code != httpx.codes.OK:
- # failed back to get method
- resp = ssrf_proxy.get(decoded_url, timeout=3)
- resp.raise_for_status()
- return {
- "file_type": resp.headers.get("Content-Type", "application/octet-stream"),
- "file_length": int(resp.headers.get("Content-Length", -1)),
- }
-
-
- @web_ns.route("/remote-files/upload")
- class RemoteFileUploadApi(WebApiResource):
- @web_ns.doc("upload_remote_file")
- @web_ns.doc(description="Upload a file from a remote URL")
- @web_ns.doc(
- responses={
- 201: "Remote file uploaded successfully",
- 400: "Bad request - invalid URL or parameters",
- 413: "File too large",
- 415: "Unsupported file type",
- 500: "Failed to fetch remote file",
- }
- )
- @marshal_with(build_file_with_signed_url_model(web_ns))
- def post(self, app_model, end_user):
- """Upload a file from a remote URL.
-
- Downloads a file from the provided remote URL and uploads it
- to the platform storage for use in web applications.
-
- Args:
- app_model: The associated application model
- end_user: The end user making the request
-
- JSON Parameters:
- url: The remote URL to download the file from (required)
-
- Returns:
- dict: File information including ID, signed URL, and metadata
- int: HTTP status code 201 for success
-
- Raises:
- RemoteFileUploadError: Failed to fetch file from remote URL
- FileTooLargeError: File exceeds size limit
- UnsupportedFileTypeError: File type not supported
- """
- parser = reqparse.RequestParser()
- parser.add_argument("url", type=str, required=True, help="URL is required")
- args = parser.parse_args()
-
- url = args["url"]
-
- try:
- resp = ssrf_proxy.head(url=url)
- if resp.status_code != httpx.codes.OK:
- resp = ssrf_proxy.get(url=url, timeout=3, follow_redirects=True)
- if resp.status_code != httpx.codes.OK:
- raise RemoteFileUploadError(f"Failed to fetch file from {url}: {resp.text}")
- except httpx.RequestError as e:
- raise RemoteFileUploadError(f"Failed to fetch file from {url}: {str(e)}")
-
- file_info = helpers.guess_file_info_from_response(resp)
-
- if not FileService.is_file_size_within_limit(extension=file_info.extension, file_size=file_info.size):
- raise FileTooLargeError
-
- content = resp.content if resp.request.method == "GET" else ssrf_proxy.get(url).content
-
- try:
- upload_file = FileService(db.engine).upload_file(
- filename=file_info.filename,
- content=content,
- mimetype=file_info.mimetype,
- user=end_user,
- source_url=url,
- )
- except services.errors.file.FileTooLargeError as file_too_large_error:
- raise FileTooLargeError(file_too_large_error.description)
- except services.errors.file.UnsupportedFileTypeError:
- raise UnsupportedFileTypeError
-
- return {
- "id": upload_file.id,
- "name": upload_file.name,
- "size": upload_file.size,
- "extension": upload_file.extension,
- "url": file_helpers.get_signed_file_url(upload_file_id=upload_file.id),
- "mime_type": upload_file.mime_type,
- "created_by": upload_file.created_by,
- "created_at": upload_file.created_at,
- }, 201
|