ssrf_proxy.py 2.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384
"""
Proxy outbound HTTP requests to mitigate SSRF (server-side request forgery).
"""
  4. import logging
  5. import os
  6. import time
  7. import httpx
  8. SSRF_PROXY_ALL_URL = os.getenv("SSRF_PROXY_ALL_URL", "")
  9. SSRF_PROXY_HTTP_URL = os.getenv("SSRF_PROXY_HTTP_URL", "")
  10. SSRF_PROXY_HTTPS_URL = os.getenv("SSRF_PROXY_HTTPS_URL", "")
  11. SSRF_DEFAULT_MAX_RETRIES = int(os.getenv("SSRF_DEFAULT_MAX_RETRIES", "3"))
  12. proxy_mounts = (
  13. {
  14. "http://": httpx.HTTPTransport(proxy=SSRF_PROXY_HTTP_URL),
  15. "https://": httpx.HTTPTransport(proxy=SSRF_PROXY_HTTPS_URL),
  16. }
  17. if SSRF_PROXY_HTTP_URL and SSRF_PROXY_HTTPS_URL
  18. else None
  19. )
  20. BACKOFF_FACTOR = 0.5
  21. STATUS_FORCELIST = [429, 500, 502, 503, 504]
  22. def make_request(method, url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  23. if "allow_redirects" in kwargs:
  24. allow_redirects = kwargs.pop("allow_redirects")
  25. if "follow_redirects" not in kwargs:
  26. kwargs["follow_redirects"] = allow_redirects
  27. retries = 0
  28. while retries <= max_retries:
  29. try:
  30. if SSRF_PROXY_ALL_URL:
  31. with httpx.Client(proxy=SSRF_PROXY_ALL_URL) as client:
  32. response = client.request(method=method, url=url, **kwargs)
  33. elif proxy_mounts:
  34. with httpx.Client(mounts=proxy_mounts) as client:
  35. response = client.request(method=method, url=url, **kwargs)
  36. else:
  37. with httpx.Client() as client:
  38. response = client.request(method=method, url=url, **kwargs)
  39. if response.status_code not in STATUS_FORCELIST:
  40. return response
  41. else:
  42. logging.warning(f"Received status code {response.status_code} for URL {url} which is in the force list")
  43. except httpx.RequestError as e:
  44. logging.warning(f"Request to URL {url} failed on attempt {retries + 1}: {e}")
  45. retries += 1
  46. if retries <= max_retries:
  47. time.sleep(BACKOFF_FACTOR * (2 ** (retries - 1)))
  48. raise Exception(f"Reached maximum retries ({max_retries}) for URL {url}")
  49. def get(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  50. return make_request("GET", url, max_retries=max_retries, **kwargs)
  51. def post(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  52. return make_request("POST", url, max_retries=max_retries, **kwargs)
  53. def put(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  54. return make_request("PUT", url, max_retries=max_retries, **kwargs)
  55. def patch(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  56. return make_request("PATCH", url, max_retries=max_retries, **kwargs)
  57. def delete(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  58. return make_request("DELETE", url, max_retries=max_retries, **kwargs)
  59. def head(url, max_retries=SSRF_DEFAULT_MAX_RETRIES, **kwargs):
  60. return make_request("HEAD", url, max_retries=max_retries, **kwargs)