ssrf_proxy.py 3.0 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091
  1. """
  2. Proxy requests to avoid SSRF
  3. """
  4. import logging
  5. import time
  6. import httpx
  7. from configs import dify_config
  8. SSRF_DEFAULT_MAX_RETRIES = dify_config.SSRF_DEFAULT_MAX_RETRIES
  9. proxy_mounts = (
  10. {
  11. "http://": httpx.HTTPTransport(proxy=dify_config.SSRF_PROXY_HTTP_URL),
  12. "https://": httpx.HTTPTransport(proxy=dify_config.SSRF_PROXY_HTTPS_URL),
  13. }
  14. if dify_config.SSRF_PROXY_HTTP_URL and dify_config.SSRF_PROXY_HTTPS_URL
  15. else None
  16. )
  17. BACKOFF_FACTOR = 0.5
  18. STATUS_FORCELIST = [429, 500, 502, 503, 504]
  19. def make_request(method, url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  20. if "allow_redirects" in kwargs:
  21. allow_redirects = kwargs.pop("allow_redirects")
  22. if "follow_redirects" not in kwargs:
  23. kwargs["follow_redirects"] = allow_redirects
  24. if "timeout" not in kwargs:
  25. kwargs["timeout"] = httpx.Timeout(
  26. timeout=dify_config.SSRF_DEFAULT_TIME_OUT,
  27. connect=dify_config.SSRF_DEFAULT_CONNECT_TIME_OUT,
  28. read=dify_config.SSRF_DEFAULT_READ_TIME_OUT,
  29. write=dify_config.SSRF_DEFAULT_WRITE_TIME_OUT,
  30. )
  31. retries = 0
  32. while retries <= max_retries:
  33. try:
  34. if dify_config.SSRF_PROXY_ALL_URL:
  35. with httpx.Client(proxy=dify_config.SSRF_PROXY_ALL_URL) as client:
  36. response = client.request(method=method, url=url, **kwargs)
  37. elif proxy_mounts:
  38. with httpx.Client(mounts=proxy_mounts) as client:
  39. response = client.request(method=method, url=url, **kwargs)
  40. else:
  41. with httpx.Client() as client:
  42. response = client.request(method=method, url=url, **kwargs)
  43. if response.status_code not in STATUS_FORCELIST:
  44. return response
  45. else:
  46. logging.warning(f"Received status code {response.status_code} for URL {url} which is in the force list")
  47. except httpx.RequestError as e:
  48. logging.warning(f"Request to URL {url} failed on attempt {retries + 1}: {e}")
  49. retries += 1
  50. if retries <= max_retries:
  51. time.sleep(BACKOFF_FACTOR * (2 ** (retries - 1)))
  52. raise Exception(f"Reached maximum retries ({max_retries}) for URL {url}")
  53. def get(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  54. return make_request("GET", url, max_retries=max_retries, **kwargs)
  55. def post(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  56. return make_request("POST", url, max_retries=max_retries, **kwargs)
  57. def put(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  58. return make_request("PUT", url, max_retries=max_retries, **kwargs)
  59. def patch(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  60. return make_request("PATCH", url, max_retries=max_retries, **kwargs)
  61. def delete(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  62. return make_request("DELETE", url, max_retries=max_retries, **kwargs)
  63. def head(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  64. return make_request("HEAD", url, max_retries=max_retries, **kwargs)