-
Notifications
You must be signed in to change notification settings - Fork 89
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[Python]: Fix concurrency issues in caching for urllib3<2.0 (#1183)
- Loading branch information
Showing
6 changed files
with
710 additions
and
3 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,86 @@ | ||
# mypy: disable-error-code="import-untyped" | ||
import functools | ||
|
||
import six # noqa | ||
This comment has been minimized.
Sorry, something went wrong. |
||
from urllib3 import __version__ as urllib3version # noqa | ||
from urllib3 import connection # noqa | ||
|
||
|
||
# Copied from https://github.com/urllib3/urllib3/blob/1c994dfc8c5d5ecaee8ed3eb585d4785f5febf6e/src/urllib3/connection.py#L231 | ||
def request(self, method, url, body=None, headers=None): | ||
"""Make the request. | ||
This function is based on the urllib3 request method, with modifications | ||
to handle potential issues when using vcrpy in concurrent workloads. | ||
Args: | ||
self: The HTTPConnection instance. | ||
method (str): The HTTP method (e.g., 'GET', 'POST'). | ||
url (str): The URL for the request. | ||
body (Optional[Any]): The body of the request. | ||
headers (Optional[dict]): Headers to send with the request. | ||
Returns: | ||
The result of calling the parent request method. | ||
""" | ||
# Update the inner socket's timeout value to send the request. | ||
# This only triggers if the connection is re-used. | ||
if getattr(self, "sock", None) is not None: | ||
self.sock.settimeout(self.timeout) | ||
|
||
if headers is None: | ||
headers = {} | ||
else: | ||
# Avoid modifying the headers passed into .request() | ||
headers = headers.copy() | ||
if "user-agent" not in (six.ensure_str(k.lower()) for k in headers): | ||
headers["User-Agent"] = connection._get_default_user_agent() | ||
# The above is all the same ^^^ | ||
# The following is different: | ||
return self._parent_request(method, url, body=body, headers=headers) | ||
|
||
|
||
_PATCHED = False | ||
|
||
|
||
def patch_urllib3(): | ||
"""Patch the request method of urllib3 to avoid type errors when using vcrpy. | ||
In concurrent workloads (such as the tracing background queue), the | ||
connection pool can get in a state where an HTTPConnection is created | ||
before vcrpy patches the HTTPConnection class. In urllib3 >= 2.0 this isn't | ||
a problem since they use the proper super().request(...) syntax, but in older | ||
versions, super(HTTPConnection, self).request is used, resulting in a TypeError | ||
since self is no longer a subclass of "HTTPConnection" (which at this point | ||
is vcr.stubs.VCRConnection). | ||
This method patches the class to fix the super() syntax to avoid mixed inheritance. | ||
In the case of the LangSmith tracing logic, it doesn't really matter since we always | ||
exclude cache checks for calls to LangSmith. | ||
The patch is only applied for urllib3 versions older than 2.0. | ||
""" | ||
global _PATCHED | ||
if _PATCHED: | ||
return | ||
from packaging import version | ||
|
||
if version.parse(urllib3version) >= version.parse("2.0"): | ||
_PATCHED = True | ||
return | ||
|
||
# Lookup the parent class and its request method | ||
parent_class = connection.HTTPConnection.__bases__[0] | ||
parent_request = parent_class.request | ||
|
||
def new_request(self, *args, **kwargs): | ||
"""Handle parent request. | ||
This method binds the parent's request method to self and then | ||
calls our modified request function. | ||
""" | ||
self._parent_request = functools.partial(parent_request, self) | ||
return request(self, *args, **kwargs) | ||
|
||
connection.HTTPConnection.request = new_request | ||
_PATCHED = True |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.
This line breaks langsmith at the moment, add it to pyproject.toml?