remote_files.py 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081
  1. import urllib.parse
  2. import httpx
  3. from flask_restful import marshal_with, reqparse # type: ignore
  4. import services
  5. from controllers.common import helpers
  6. from controllers.common.errors import RemoteFileUploadError
  7. from controllers.web.wraps import WebApiResource
  8. from core.file import helpers as file_helpers
  9. from core.helper import ssrf_proxy
  10. from fields.file_fields import file_fields_with_signed_url, remote_file_info_fields
  11. from services.file_service import FileService
  12. from .error import FileTooLargeError, UnsupportedFileTypeError
  13. class RemoteFileInfoApi(WebApiResource):
  14. @marshal_with(remote_file_info_fields)
  15. def get(self, app_model, end_user, url):
  16. decoded_url = urllib.parse.unquote(url)
  17. resp = ssrf_proxy.head(decoded_url)
  18. if resp.status_code != httpx.codes.OK:
  19. # failed back to get method
  20. resp = ssrf_proxy.get(decoded_url, timeout=3)
  21. resp.raise_for_status()
  22. return {
  23. "file_type": resp.headers.get("Content-Type", "application/octet-stream"),
  24. "file_length": int(resp.headers.get("Content-Length", -1)),
  25. }
  26. class RemoteFileUploadApi(WebApiResource):
  27. @marshal_with(file_fields_with_signed_url)
  28. def post(self, app_model, end_user): # Add app_model and end_user parameters
  29. parser = reqparse.RequestParser()
  30. parser.add_argument("url", type=str, required=True, help="URL is required")
  31. args = parser.parse_args()
  32. url = args["url"]
  33. try:
  34. resp = ssrf_proxy.head(url=url)
  35. if resp.status_code != httpx.codes.OK:
  36. resp = ssrf_proxy.get(url=url, timeout=3, follow_redirects=True)
  37. if resp.status_code != httpx.codes.OK:
  38. raise RemoteFileUploadError(f"Failed to fetch file from {url}: {resp.text}")
  39. except httpx.RequestError as e:
  40. raise RemoteFileUploadError(f"Failed to fetch file from {url}: {str(e)}")
  41. file_info = helpers.guess_file_info_from_response(resp)
  42. if not FileService.is_file_size_within_limit(extension=file_info.extension, file_size=file_info.size):
  43. raise FileTooLargeError
  44. content = resp.content if resp.request.method == "GET" else ssrf_proxy.get(url).content
  45. try:
  46. upload_file = FileService.upload_file(
  47. filename=file_info.filename,
  48. content=content,
  49. mimetype=file_info.mimetype,
  50. user=end_user,
  51. source_url=url,
  52. )
  53. except services.errors.file.FileTooLargeError as file_too_large_error:
  54. raise FileTooLargeError(file_too_large_error.description)
  55. except services.errors.file.UnsupportedFileTypeError:
  56. raise UnsupportedFileTypeError
  57. return {
  58. "id": upload_file.id,
  59. "name": upload_file.name,
  60. "size": upload_file.size,
  61. "extension": upload_file.extension,
  62. "url": file_helpers.get_signed_file_url(upload_file_id=upload_file.id),
  63. "mime_type": upload_file.mime_type,
  64. "created_by": upload_file.created_by,
  65. "created_at": upload_file.created_at,
  66. }, 201