-
Notifications
You must be signed in to change notification settings - Fork 1.1k
PYTHON-5306 - Fix use of public MongoClient attributes before connection #2285
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 6 commits
aa86a3a
c185c95
763e78c
66b7e8d
5f7f84a
ed3dea5
99802be
14bb119
c1e6684
2a63a3b
835e560
e5e6dc8
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -109,6 +109,7 @@ | |
) | ||
from pymongo.read_preferences import ReadPreference, _ServerMode | ||
from pymongo.results import ClientBulkWriteResult | ||
from pymongo.server_description import ServerDescription | ||
from pymongo.server_selectors import writable_server_selector | ||
from pymongo.server_type import SERVER_TYPE | ||
from pymongo.topology_description import TOPOLOGY_TYPE, TopologyDescription | ||
|
@@ -767,6 +768,7 @@ def __init__( | |
self._timeout: float | None = None | ||
self._topology_settings: TopologySettings = None # type: ignore[assignment] | ||
self._event_listeners: _EventListeners | None = None | ||
self._initial_topology_id: Optional[ObjectId] = None | ||
|
||
# _pool_class, _monitor_class, and _condition_class are for deep | ||
# customization of PyMongo, e.g. Motor. | ||
|
@@ -779,7 +781,7 @@ def __init__( | |
keyword_opts["document_class"] = doc_class | ||
self._resolve_srv_info: dict[str, Any] = {"keyword_opts": keyword_opts} | ||
|
||
seeds = set() | ||
self._seeds = set() | ||
is_srv = False | ||
username = None | ||
password = None | ||
|
@@ -804,18 +806,18 @@ def __init__( | |
srv_max_hosts=srv_max_hosts, | ||
) | ||
is_srv = entity.startswith(SRV_SCHEME) | ||
seeds.update(res["nodelist"]) | ||
self._seeds.update(res["nodelist"]) | ||
username = res["username"] or username | ||
password = res["password"] or password | ||
dbase = res["database"] or dbase | ||
opts = res["options"] | ||
fqdn = res["fqdn"] | ||
else: | ||
seeds.update(split_hosts(entity, self._port)) | ||
if not seeds: | ||
self._seeds.update(split_hosts(entity, self._port)) | ||
if not self._seeds: | ||
raise ConfigurationError("need to specify at least one host") | ||
|
||
for hostname in [node[0] for node in seeds]: | ||
for hostname in [node[0] for node in self._seeds]: | ||
if _detect_external_db(hostname): | ||
break | ||
|
||
|
@@ -838,7 +840,7 @@ def __init__( | |
srv_service_name = opts.get("srvServiceName", common.SRV_SERVICE_NAME) | ||
|
||
srv_max_hosts = srv_max_hosts or opts.get("srvmaxhosts") | ||
opts = self._normalize_and_validate_options(opts, seeds) | ||
opts = self._normalize_and_validate_options(opts, self._seeds) | ||
|
||
# Username and password passed as kwargs override user info in URI. | ||
username = opts.get("username", username) | ||
|
@@ -857,7 +859,7 @@ def __init__( | |
"username": username, | ||
"password": password, | ||
"dbase": dbase, | ||
"seeds": seeds, | ||
"seeds": self._seeds, | ||
"fqdn": fqdn, | ||
"srv_service_name": srv_service_name, | ||
"pool_class": pool_class, | ||
|
@@ -874,7 +876,7 @@ def __init__( | |
) | ||
|
||
if not is_srv: | ||
self._init_based_on_options(seeds, srv_max_hosts, srv_service_name) | ||
self._init_based_on_options(self._seeds, srv_max_hosts, srv_service_name) | ||
|
||
self._opened = False | ||
self._closed = False | ||
|
@@ -975,6 +977,7 @@ def _init_based_on_options( | |
srv_service_name=srv_service_name, | ||
srv_max_hosts=srv_max_hosts, | ||
server_monitoring_mode=self._options.server_monitoring_mode, | ||
topology_id=self._initial_topology_id, | ||
) | ||
if self._options.auto_encryption_opts: | ||
from pymongo.asynchronous.encryption import _Encrypter | ||
|
@@ -1205,6 +1208,18 @@ def topology_description(self) -> TopologyDescription: | |
|
||
.. versionadded:: 4.0 | ||
""" | ||
if self._topology is None: | ||
servers = {(host, port): ServerDescription((host, port)) for host, port in self._seeds} | ||
td = TopologyDescription( | ||
TOPOLOGY_TYPE.Unknown, | ||
servers, | ||
None, | ||
None, | ||
None, | ||
TopologySettings(), | ||
) | ||
self._initial_topology_id = td._topology_settings._topology_id | ||
return td | ||
return self._topology.description | ||
|
||
@property | ||
|
@@ -1218,6 +1233,8 @@ def nodes(self) -> FrozenSet[_Address]: | |
to any servers, or a network partition causes it to lose connection | ||
to all servers. | ||
""" | ||
if self._topology is None: | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. As the docstring defines, we expect |
||
return frozenset() | ||
description = self._topology.description | ||
return frozenset(s.address for s in description.known_servers) | ||
|
||
|
@@ -1576,6 +1593,8 @@ async def address(self) -> Optional[tuple[str, int]]: | |
|
||
.. versionadded:: 3.0 | ||
""" | ||
if self._topology is None: | ||
await self._get_topology() | ||
topology_type = self._topology._description.topology_type | ||
if ( | ||
topology_type == TOPOLOGY_TYPE.Sharded | ||
|
@@ -1598,6 +1617,8 @@ async def primary(self) -> Optional[tuple[str, int]]: | |
.. versionadded:: 3.0 | ||
AsyncMongoClient gained this property in version 3.0. | ||
""" | ||
if self._topology is None: | ||
await self._get_topology() | ||
return await self._topology.get_primary() # type: ignore[return-value] | ||
|
||
@property | ||
|
@@ -1611,6 +1632,8 @@ async def secondaries(self) -> set[_Address]: | |
.. versionadded:: 3.0 | ||
AsyncMongoClient gained this property in version 3.0. | ||
""" | ||
if self._topology is None: | ||
await self._get_topology() | ||
return await self._topology.get_secondaries() | ||
|
||
@property | ||
|
@@ -1621,6 +1644,8 @@ async def arbiters(self) -> set[_Address]: | |
connected to a replica set, there are no arbiters, or this client was | ||
created without the `replicaSet` option. | ||
""" | ||
if self._topology is None: | ||
await self._get_topology() | ||
return await self._topology.get_arbiters() | ||
|
||
@property | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -101,6 +101,7 @@ | |
) | ||
from pymongo.read_preferences import ReadPreference, _ServerMode | ||
from pymongo.results import ClientBulkWriteResult | ||
from pymongo.server_description import ServerDescription | ||
from pymongo.server_selectors import writable_server_selector | ||
from pymongo.server_type import SERVER_TYPE | ||
from pymongo.synchronous import client_session, database, uri_parser | ||
|
@@ -765,6 +766,7 @@ def __init__( | |
self._timeout: float | None = None | ||
self._topology_settings: TopologySettings = None # type: ignore[assignment] | ||
self._event_listeners: _EventListeners | None = None | ||
self._initial_topology_id: Optional[ObjectId] = None | ||
|
||
# _pool_class, _monitor_class, and _condition_class are for deep | ||
# customization of PyMongo, e.g. Motor. | ||
|
@@ -777,7 +779,7 @@ def __init__( | |
keyword_opts["document_class"] = doc_class | ||
self._resolve_srv_info: dict[str, Any] = {"keyword_opts": keyword_opts} | ||
|
||
seeds = set() | ||
self._seeds = set() | ||
is_srv = False | ||
username = None | ||
password = None | ||
|
@@ -802,18 +804,18 @@ def __init__( | |
srv_max_hosts=srv_max_hosts, | ||
) | ||
is_srv = entity.startswith(SRV_SCHEME) | ||
seeds.update(res["nodelist"]) | ||
self._seeds.update(res["nodelist"]) | ||
username = res["username"] or username | ||
password = res["password"] or password | ||
dbase = res["database"] or dbase | ||
opts = res["options"] | ||
fqdn = res["fqdn"] | ||
else: | ||
seeds.update(split_hosts(entity, self._port)) | ||
if not seeds: | ||
self._seeds.update(split_hosts(entity, self._port)) | ||
if not self._seeds: | ||
raise ConfigurationError("need to specify at least one host") | ||
|
||
for hostname in [node[0] for node in seeds]: | ||
for hostname in [node[0] for node in self._seeds]: | ||
if _detect_external_db(hostname): | ||
break | ||
|
||
|
@@ -836,7 +838,7 @@ def __init__( | |
srv_service_name = opts.get("srvServiceName", common.SRV_SERVICE_NAME) | ||
|
||
srv_max_hosts = srv_max_hosts or opts.get("srvmaxhosts") | ||
opts = self._normalize_and_validate_options(opts, seeds) | ||
opts = self._normalize_and_validate_options(opts, self._seeds) | ||
|
||
# Username and password passed as kwargs override user info in URI. | ||
username = opts.get("username", username) | ||
|
@@ -855,7 +857,7 @@ def __init__( | |
"username": username, | ||
"password": password, | ||
"dbase": dbase, | ||
"seeds": seeds, | ||
"seeds": self._seeds, | ||
"fqdn": fqdn, | ||
"srv_service_name": srv_service_name, | ||
"pool_class": pool_class, | ||
|
@@ -872,7 +874,7 @@ def __init__( | |
) | ||
|
||
if not is_srv: | ||
self._init_based_on_options(seeds, srv_max_hosts, srv_service_name) | ||
self._init_based_on_options(self._seeds, srv_max_hosts, srv_service_name) | ||
|
||
self._opened = False | ||
self._closed = False | ||
|
@@ -973,6 +975,7 @@ def _init_based_on_options( | |
srv_service_name=srv_service_name, | ||
srv_max_hosts=srv_max_hosts, | ||
server_monitoring_mode=self._options.server_monitoring_mode, | ||
topology_id=self._initial_topology_id, | ||
) | ||
if self._options.auto_encryption_opts: | ||
from pymongo.synchronous.encryption import _Encrypter | ||
|
@@ -1203,6 +1206,18 @@ def topology_description(self) -> TopologyDescription: | |
|
||
.. versionadded:: 4.0 | ||
""" | ||
if self._topology is None: | ||
servers = {(host, port): ServerDescription((host, port)) for host, port in self._seeds} | ||
td = TopologyDescription( | ||
TOPOLOGY_TYPE.Unknown, | ||
servers, | ||
None, | ||
None, | ||
None, | ||
TopologySettings(), | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This is missing certain settings that are publicly accessible, like TopologyDescription.heartbeat_frequency. In the ticket I suggested making the MongoClient constructor always create the Topology instance, and then mutate it later once the SRV info is resolved. Did you consider that approach? It would avoid the problem of attempting to mock out these attributes and avoid the type-ignores since everything would always be non-None. (It could be that this approach is a better fit, I just want to know if an alternative was considered.) There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I started with the approach you suggested, but switched to the current implementation for a few reasons:
This approach has fewer changes that could cause errors, especially since it isolates changes to resolving the specific issue at hand. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Thanks, could you update There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Like I said above, There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. For example:
>>> client = MongoClient(..., connect=False, heartbeatFrequencyMS=99999)
>>> client.topology_description.heartbeat_frequency
10
>>> client.admin.command("ping")
...
>>> client.topology_description.heartbeat_frequency
99.999
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Sorry, I misunderstood what you meant. The example makes it clear, thanks! There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Now we always initialize a |
||
) | ||
self._initial_topology_id = td._topology_settings._topology_id | ||
return td | ||
return self._topology.description | ||
|
||
@property | ||
|
@@ -1216,6 +1231,8 @@ def nodes(self) -> FrozenSet[_Address]: | |
to any servers, or a network partition causes it to lose connection | ||
to all servers. | ||
""" | ||
if self._topology is None: | ||
return frozenset() | ||
description = self._topology.description | ||
return frozenset(s.address for s in description.known_servers) | ||
|
||
|
@@ -1570,6 +1587,8 @@ def address(self) -> Optional[tuple[str, int]]: | |
|
||
.. versionadded:: 3.0 | ||
""" | ||
if self._topology is None: | ||
self._get_topology() | ||
topology_type = self._topology._description.topology_type | ||
if ( | ||
topology_type == TOPOLOGY_TYPE.Sharded | ||
|
@@ -1592,6 +1611,8 @@ def primary(self) -> Optional[tuple[str, int]]: | |
.. versionadded:: 3.0 | ||
MongoClient gained this property in version 3.0. | ||
""" | ||
if self._topology is None: | ||
self._get_topology() | ||
return self._topology.get_primary() # type: ignore[return-value] | ||
|
||
@property | ||
|
@@ -1605,6 +1626,8 @@ def secondaries(self) -> set[_Address]: | |
.. versionadded:: 3.0 | ||
MongoClient gained this property in version 3.0. | ||
""" | ||
if self._topology is None: | ||
self._get_topology() | ||
return self._topology.get_secondaries() | ||
|
||
@property | ||
|
@@ -1615,6 +1638,8 @@ def arbiters(self) -> set[_Address]: | |
connected to a replica set, there are no arbiters, or this client was | ||
created without the `replicaSet` option. | ||
""" | ||
if self._topology is None: | ||
self._get_topology() | ||
return self._topology.get_arbiters() | ||
|
||
@property | ||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -849,6 +849,54 @@ async def test_init_disconnected_with_auth(self): | |
with self.assertRaises(ConnectionFailure): | ||
await c.pymongo_test.test.find_one() | ||
|
||
@async_client_context.require_replica_set | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I believe we can remove require_replica_set. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Removing it causes failures on any non-replica topology: https://spruce.mongodb.com/task/mongo_python_driver_mongodb_latest_test_python3.9_auth_ssl_standalone_cov_patch_846b1fc25ced5979ade934bb27d6ffbb60f68267_68010865cc419c000710589f_25_04_17_13_56_05?execution=0&sortBy=STATUS&sortDir=ASC I assume this is due to SRV requiring SSL + replica to function. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Oh I see. "mongodb+srv://test1.test.build.10gen.cc" returns 2 hosts so it can't connect to standalone. It can connect to Mongos though so we should run this test on both replica set and sharded. There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
There was a problem hiding this comment. Choose a reason for hiding this comment. The reason will be displayed to describe this comment to others. Learn more. Load balancers probably don't work here so it would need to be |
||
@async_client_context.require_tls | ||
async def test_init_disconnected_with_srv(self): | ||
c = await self.async_rs_or_single_client( | ||
"mongodb+srv://test1.test.build.10gen.cc", connect=False, tlsInsecure=True | ||
) | ||
# nodes returns an empty set if not connected | ||
self.assertEqual(c.nodes, frozenset()) | ||
# topology_description returns the initial seed description if not connected | ||
topology_description = c.topology_description | ||
self.assertEqual(topology_description.topology_type, TOPOLOGY_TYPE.Unknown) | ||
self.assertEqual( | ||
{ | ||
("test1.test.build.10gen.cc", None): ServerDescription( | ||
("test1.test.build.10gen.cc", None) | ||
) | ||
}, | ||
topology_description.server_descriptions(), | ||
) | ||
|
||
# address causes client to block until connected | ||
self.assertIsNotNone(await c.address) | ||
# Initial seed topology and connected topology have the same ID | ||
self.assertEqual( | ||
c._topology._topology_id, topology_description._topology_settings._topology_id | ||
) | ||
|
||
c = await self.async_rs_or_single_client( | ||
"mongodb+srv://test1.test.build.10gen.cc", connect=False, tlsInsecure=True | ||
) | ||
# primary causes client to block until connected | ||
await c.primary | ||
self.assertIsNotNone(c._topology) | ||
|
||
c = await self.async_rs_or_single_client( | ||
"mongodb+srv://test1.test.build.10gen.cc", connect=False, tlsInsecure=True | ||
) | ||
# secondaries causes client to block until connected | ||
await c.secondaries | ||
self.assertIsNotNone(c._topology) | ||
|
||
c = await self.async_rs_or_single_client( | ||
"mongodb+srv://test1.test.build.10gen.cc", connect=False, tlsInsecure=True | ||
) | ||
# arbiters causes client to block until connected | ||
await c.arbiters | ||
self.assertIsNotNone(c._topology) | ||
|
||
async def test_equality(self): | ||
seed = "{}:{}".format(*list(self.client._topology_settings.seeds)[0]) | ||
c = await self.async_rs_or_single_client(seed, connect=False) | ||
|
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
If the client has not connected yet, return a `TopologyDescription` with placeholder servers derived from the seeds passed to the client's constructor.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
We should make sure the returned TopologyDescription has the same _topology_id. Otherwise it could be confusing because _topology_id will change.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Also can you give an example of what topology_description looks like in the connect=False srv case?
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
<TopologyDescription id: 67ffb68a6e12ca176991f521, topology_type: Unknown, servers: [<ServerDescription (('test1.test.build.10gen.cc', None), 27017) server_type: Unknown, rtt: None>]>
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Please include an example of this new/old behavior in the Jira ticket when closing.