"""Proxy requests to avoid SSRF"""

import logging
import time

import httpx

from configs import dify_config

SSRF_DEFAULT_MAX_RETRIES = dify_config.SSRF_DEFAULT_MAX_RETRIES

HTTP_REQUEST_NODE_SSL_VERIFY = True  # Default value for HTTP_REQUEST_NODE_SSL_VERIFY is True
try:
    HTTP_REQUEST_NODE_SSL_VERIFY = dify_config.HTTP_REQUEST_NODE_SSL_VERIFY
    # The setting may arrive as a bool or as a string; normalise both to a real bool.
    http_request_node_ssl_verify_lower = str(HTTP_REQUEST_NODE_SSL_VERIFY).lower()
    if http_request_node_ssl_verify_lower == "true":
        HTTP_REQUEST_NODE_SSL_VERIFY = True
    elif http_request_node_ssl_verify_lower == "false":
        HTTP_REQUEST_NODE_SSL_VERIFY = False
    else:
        raise ValueError("Invalid value. HTTP_REQUEST_NODE_SSL_VERIFY should be 'True' or 'False'")
except (NameError, AttributeError):
    # A setting that is absent from the config object surfaces as AttributeError
    # (NameError alone never fires for attribute access), so catch both and fall
    # back to the secure default.
    HTTP_REQUEST_NODE_SSL_VERIFY = True

# Delay before retry k (1-based) is BACKOFF_FACTOR * 2 ** (k - 1) seconds.
BACKOFF_FACTOR = 0.5
# Response status codes that trigger another attempt instead of being returned.
STATUS_FORCELIST = [429, 500, 502, 503, 504]


class MaxRetriesExceededError(ValueError):
    """Raised when the maximum number of retries is exceeded."""


def _build_client() -> httpx.Client:
    """Create an ``httpx.Client`` routed through the configured SSRF proxy, if any.

    Precedence: a single proxy for all traffic (``SSRF_PROXY_ALL_URL``), then a
    pair of per-scheme proxies (``SSRF_PROXY_HTTP_URL`` and
    ``SSRF_PROXY_HTTPS_URL``, both required), otherwise a direct client.
    """
    if dify_config.SSRF_PROXY_ALL_URL:
        return httpx.Client(proxy=dify_config.SSRF_PROXY_ALL_URL, verify=HTTP_REQUEST_NODE_SSL_VERIFY)

    if dify_config.SSRF_PROXY_HTTP_URL and dify_config.SSRF_PROXY_HTTPS_URL:
        # Explicitly constructed transports do not inherit the client's ``verify``
        # option, so it has to be passed to each transport as well; otherwise the
        # SSL-verify setting would be ignored for proxied traffic.
        proxy_mounts = {
            "http://": httpx.HTTPTransport(
                proxy=dify_config.SSRF_PROXY_HTTP_URL,
                verify=HTTP_REQUEST_NODE_SSL_VERIFY,
            ),
            "https://": httpx.HTTPTransport(
                proxy=dify_config.SSRF_PROXY_HTTPS_URL,
                verify=HTTP_REQUEST_NODE_SSL_VERIFY,
            ),
        }
        return httpx.Client(mounts=proxy_mounts, verify=HTTP_REQUEST_NODE_SSL_VERIFY)

    return httpx.Client(verify=HTTP_REQUEST_NODE_SSL_VERIFY)


def make_request(method, url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs) -> httpx.Response:
    """Send an HTTP request through the SSRF proxy, retrying transient failures.

    Args:
        method: HTTP method name, e.g. ``"GET"``.
        url: Target URL.
        max_retries: Number of retries after the first attempt; the request is
            tried at most ``max_retries + 1`` times. A negative value means no
            attempt is made at all.
        **kwargs: Forwarded to ``httpx.Client.request``. ``allow_redirects`` is
            accepted as an alias for ``follow_redirects`` (an explicit
            ``follow_redirects`` wins). When ``timeout`` is omitted, a timeout
            built from the ``SSRF_DEFAULT_*_TIME_OUT`` settings is used.

    Returns:
        The first response whose status code is not in ``STATUS_FORCELIST``.

    Raises:
        httpx.RequestError: If the request fails and ``max_retries`` is 0.
        MaxRetriesExceededError: If every attempt failed or returned a status
            in ``STATUS_FORCELIST``. When the final attempt failed with an
            ``httpx.RequestError``, that error is attached as ``__cause__``.
    """
    if "allow_redirects" in kwargs:
        allow_redirects = kwargs.pop("allow_redirects")
        kwargs.setdefault("follow_redirects", allow_redirects)

    if "timeout" not in kwargs:
        kwargs["timeout"] = httpx.Timeout(
            timeout=dify_config.SSRF_DEFAULT_TIME_OUT,
            connect=dify_config.SSRF_DEFAULT_CONNECT_TIME_OUT,
            read=dify_config.SSRF_DEFAULT_READ_TIME_OUT,
            write=dify_config.SSRF_DEFAULT_WRITE_TIME_OUT,
        )

    last_error = None
    retries = 0
    while retries <= max_retries:
        try:
            with _build_client() as client:
                response = client.request(method=method, url=url, **kwargs)
        except httpx.RequestError as e:
            last_error = e
            logging.warning("Request to URL %s failed on attempt %s: %s", url, retries + 1, e)
            if max_retries == 0:
                # Retries disabled: surface the original transport error unchanged.
                raise
        else:
            if response.status_code not in STATUS_FORCELIST:
                return response
            # The final failure is now a status code, not a transport error.
            last_error = None
            logging.warning(
                "Received status code %s for URL %s which is in the force list",
                response.status_code,
                url,
            )

        retries += 1
        if retries <= max_retries:
            # Exponential backoff; skipped after the final attempt.
            time.sleep(BACKOFF_FACTOR * (2 ** (retries - 1)))

    raise MaxRetriesExceededError(f"Reached maximum retries ({max_retries}) for URL {url}") from last_error


def get(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
    """Send a GET request via :func:`make_request`."""
    return make_request("GET", url, max_retries=max_retries, **kwargs)


def post(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
    """Send a POST request via :func:`make_request`."""
    return make_request("POST", url, max_retries=max_retries, **kwargs)


def put(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
    """Send a PUT request via :func:`make_request`."""
    return make_request("PUT", url, max_retries=max_retries, **kwargs)


def patch(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
    """Send a PATCH request via :func:`make_request`."""
    return make_request("PATCH", url, max_retries=max_retries, **kwargs)


def delete(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
    """Send a DELETE request via :func:`make_request`."""
    return make_request("DELETE", url, max_retries=max_retries, **kwargs)


def head(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
    """Send a HEAD request via :func:`make_request`."""
    return make_request("HEAD", url, max_retries=max_retries, **kwargs)