Skip to content

Commit ba2c350

Browse files
committed
ref(wsgi): Update _werkzeug vendor to newer version
Fixes GH-3516
1 parent 5a122b5 commit ba2c350

File tree

2 files changed

+83
-34
lines changed

2 files changed

+83
-34
lines changed

sentry_sdk/_werkzeug.py

Lines changed: 61 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -41,58 +41,85 @@
4141

4242

4343
#
44-
# `get_headers` comes from `werkzeug.datastructures.EnvironHeaders`
45-
# https://github.com/pallets/werkzeug/blob/0.14.1/werkzeug/datastructures.py#L1361
44+
# `get_headers` comes from `werkzeug.datastructures.headers.__iter__`
45+
# https://github.com/pallets/werkzeug/blob/3.1.3/src/werkzeug/datastructures/headers.py#L644
4646
#
4747
# We need this function because Django does not give us a "pure" http header
4848
# dict. So we might as well use it for all WSGI integrations.
4949
#
5050
def _get_headers(environ):
5151
# type: (Dict[str, str]) -> Iterator[Tuple[str, str]]
52-
"""
53-
Returns only proper HTTP headers.
54-
"""
5552
for key, value in environ.items():
56-
key = str(key)
57-
if key.startswith("HTTP_") and key not in (
53+
if key.startswith("HTTP_") and key not in {
5854
"HTTP_CONTENT_TYPE",
5955
"HTTP_CONTENT_LENGTH",
60-
):
56+
}:
6157
yield key[5:].replace("_", "-").title(), value
62-
elif key in ("CONTENT_TYPE", "CONTENT_LENGTH"):
58+
elif key in {"CONTENT_TYPE", "CONTENT_LENGTH"} and value:
6359
yield key.replace("_", "-").title(), value
6460

6561

6662
#
6763
# `get_host` comes from `werkzeug.wsgi.get_host`
68-
# https://github.com/pallets/werkzeug/blob/1.0.1/src/werkzeug/wsgi.py#L145
64+
# https://github.com/pallets/werkzeug/blob/3.1.3/src/werkzeug/wsgi.py#L86
6965
#
7066
def get_host(environ, use_x_forwarded_for=False):
7167
# type: (Dict[str, str], bool) -> str
7268
"""
7369
Return the host for the given WSGI environment.
7470
"""
75-
if use_x_forwarded_for and "HTTP_X_FORWARDED_HOST" in environ:
76-
rv = environ["HTTP_X_FORWARDED_HOST"]
77-
if environ["wsgi.url_scheme"] == "http" and rv.endswith(":80"):
78-
rv = rv[:-3]
79-
elif environ["wsgi.url_scheme"] == "https" and rv.endswith(":443"):
80-
rv = rv[:-4]
81-
elif environ.get("HTTP_HOST"):
82-
rv = environ["HTTP_HOST"]
83-
if environ["wsgi.url_scheme"] == "http" and rv.endswith(":80"):
84-
rv = rv[:-3]
85-
elif environ["wsgi.url_scheme"] == "https" and rv.endswith(":443"):
86-
rv = rv[:-4]
87-
elif environ.get("SERVER_NAME"):
88-
rv = environ["SERVER_NAME"]
89-
if (environ["wsgi.url_scheme"], environ["SERVER_PORT"]) not in (
90-
("https", "443"),
91-
("http", "80"),
92-
):
93-
rv += ":" + environ["SERVER_PORT"]
94-
else:
95-
# In spite of the WSGI spec, SERVER_NAME might not be present.
96-
rv = "unknown"
97-
98-
return rv
71+
return _get_host(
72+
environ["wsgi.url_scheme"],
73+
environ.get("HTTP_HOST"),
74+
_get_server(environ),
75+
)
76+
77+
78+
# `_get_host` comes from `werkzeug.sansio.utils`
79+
# https://github.com/pallets/werkzeug/blob/3.1.3/src/werkzeug/sansio/utils.py#L49
80+
def _get_host(
81+
scheme,
82+
host_header,
83+
server=None,
84+
):
85+
# type: (str, str | None, Tuple[str, int | None] | None) -> str
86+
"""
87+
Return the host for the given parameters.
88+
"""
89+
host = ""
90+
91+
if host_header is not None:
92+
host = host_header
93+
elif server is not None:
94+
host = server[0]
95+
96+
# If SERVER_NAME is IPv6, wrap it in [] to match Host header.
97+
# Check for : because domain or IPv4 can't have that.
98+
if ":" in host and host[0] != "[":
99+
host = f"[{host}]"
100+
101+
if server[1] is not None:
102+
host = f"{host}:{server[1]}" # noqa: E231
103+
104+
if scheme in {"http", "ws"} and host.endswith(":80"):
105+
host = host[:-3]
106+
elif scheme in {"https", "wss"} and host.endswith(":443"):
107+
host = host[:-4]
108+
109+
return host
110+
111+
112+
def _get_server(environ):
113+
# type: (Dict[str, str]) -> Tuple[str, int | None] | None
114+
name = environ.get("SERVER_NAME")
115+
116+
if name is None:
117+
return None
118+
119+
try:
120+
port = int(environ.get("SERVER_PORT", None))
121+
except (TypeError, ValueError):
122+
# unix socket
123+
port = None
124+
125+
return name, port

tests/integrations/wsgi/test_wsgi.py

Lines changed: 22 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -61,6 +61,28 @@ def test_basic(sentry_init, crashing_app, capture_events):
6161
}
6262

6363

64+
def test_basic_forwarded_host(sentry_init, crashing_app, capture_events):
65+
sentry_init(send_default_pii=True)
66+
app = SentryWsgiMiddleware(crashing_app, use_x_forwarded_for=True)
67+
client = Client(app)
68+
events = capture_events()
69+
70+
with pytest.raises(ZeroDivisionError):
71+
client.get("/", environ_overrides={"HTTP_X_FORWARDED_HOST": "localhost:80"})
72+
73+
(event,) = events
74+
75+
assert event["transaction"] == "generic WSGI request"
76+
77+
assert event["request"] == {
78+
"env": {"SERVER_NAME": "localhost", "SERVER_PORT": "80"},
79+
"headers": {"Host": "localhost", "X-Forwarded-Host": "localhost:80"},
80+
"method": "GET",
81+
"query_string": "",
82+
"url": "http://localhost/",
83+
}
84+
85+
6486
@pytest.mark.parametrize("path_info", ("bark/", "/bark/"))
6587
@pytest.mark.parametrize("script_name", ("woof/woof", "woof/woof/"))
6688
def test_script_name_is_respected(

0 commit comments

Comments
 (0)