# Copyright 2016 MongoDB, Inc. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Run the sdam monitoring spec tests.""" import json import os import sys import time sys.path[0:0] = [""] from test import IntegrationTest, client_context, client_knobs, unittest from test.utils import ( ServerAndTopologyEventListener, rs_or_single_client, server_name_to_type, wait_until, ) from bson.json_util import object_hook from pymongo import MongoClient, monitoring from pymongo.collection import Collection from pymongo.common import clean_node from pymongo.errors import ConnectionFailure, NotPrimaryError from pymongo.hello import Hello from pymongo.monitor import Monitor from pymongo.server_description import ServerDescription from pymongo.topology_description import TOPOLOGY_TYPE # Location of JSON test specifications. _TEST_PATH = os.path.join(os.path.dirname(os.path.realpath(__file__)), "sdam_monitoring") def compare_server_descriptions(expected, actual): if (not expected["address"] == "%s:%s" % actual.address) or ( not server_name_to_type(expected["type"]) == actual.server_type ): return False expected_hosts = set(expected["arbiters"] + expected["passives"] + expected["hosts"]) return expected_hosts == set("%s:%s" % s for s in actual.all_hosts) def compare_topology_descriptions(expected, actual): if not (TOPOLOGY_TYPE.__getattribute__(expected["topologyType"]) == actual.topology_type): return False expected = expected["servers"] actual = actual.server_descriptions() if len(expected) != len(actual): return False for exp_server in expected: for address, actual_server in actual.items(): if compare_server_descriptions(exp_server, actual_server): break else: return False return True def compare_events(expected_dict, actual): if not expected_dict: return False, "Error: Bad expected value in YAML test" if not actual: return False, "Error: Event published was None" expected_type, expected = list(expected_dict.items())[0] if expected_type == "server_opening_event": if not isinstance(actual, monitoring.ServerOpeningEvent): return False, "Expected ServerOpeningEvent, got %s" % (actual.__class__) if not expected["address"] == "%s:%s" % actual.server_address: return ( False, "ServerOpeningEvent published with wrong address (expected" " %s, got %s" % (expected["address"], actual.server_address), ) elif expected_type == "server_description_changed_event": if not isinstance(actual, monitoring.ServerDescriptionChangedEvent): return (False, "Expected ServerDescriptionChangedEvent, got %s" % (actual.__class__)) if not expected["address"] == "%s:%s" % actual.server_address: return ( False, "ServerDescriptionChangedEvent has wrong address" " (expected %s, got %s" % (expected["address"], actual.server_address), ) if not compare_server_descriptions(expected["newDescription"], actual.new_description): return (False, "New ServerDescription incorrect in ServerDescriptionChangedEvent") if not compare_server_descriptions( expected["previousDescription"], actual.previous_description ): return ( False, "Previous ServerDescription incorrect in ServerDescriptionChangedEvent", ) elif expected_type == "server_closed_event": if not isinstance(actual, monitoring.ServerClosedEvent): return False, "Expected ServerClosedEvent, got %s" % (actual.__class__) if not expected["address"] == "%s:%s" % actual.server_address: return ( False, "ServerClosedEvent published with wrong address" " (expected %s, got %s" % (expected["address"], actual.server_address), ) elif expected_type == "topology_opening_event": if not isinstance(actual, monitoring.TopologyOpenedEvent): return False, "Expected TopologyOpeningEvent, got %s" % (actual.__class__) elif expected_type == "topology_description_changed_event": if not isinstance(actual, monitoring.TopologyDescriptionChangedEvent): return ( False, "Expected TopologyDescriptionChangedEvent, got %s" % (actual.__class__), ) if not compare_topology_descriptions(expected["newDescription"], actual.new_description): return ( False, "New TopologyDescription incorrect in TopologyDescriptionChangedEvent", ) if not compare_topology_descriptions( expected["previousDescription"], actual.previous_description ): return ( False, "Previous TopologyDescription incorrect in TopologyDescriptionChangedEvent", ) elif expected_type == "topology_closed_event": if not isinstance(actual, monitoring.TopologyClosedEvent): return False, "Expected TopologyClosedEvent, got %s" % (actual.__class__) else: return False, "Incorrect event: expected %s, actual %s" % (expected_type, actual) return True, "" def compare_multiple_events(i, expected_results, actual_results): events_in_a_row = [] j = i while j < len(expected_results) and isinstance(actual_results[j], actual_results[i].__class__): events_in_a_row.append(actual_results[j]) j += 1 message = "" for event in events_in_a_row: for k in range(i, j): passed, message = compare_events(expected_results[k], event) if passed: expected_results[k] = None break else: return i, False, message return j, True, "" class TestAllScenarios(IntegrationTest): def setUp(self): super(TestAllScenarios, self).setUp() self.all_listener = ServerAndTopologyEventListener() def create_test(scenario_def): def run_scenario(self): with client_knobs(events_queue_frequency=0.1): _run_scenario(self) def _run_scenario(self): class NoopMonitor(Monitor): """Override the _run method to do nothing.""" def _run(self): time.sleep(0.05) m = MongoClient( host=scenario_def["uri"], port=27017, event_listeners=[self.all_listener], _monitor_class=NoopMonitor, ) topology = m._get_topology() try: for phase in scenario_def["phases"]: for (source, response) in phase.get("responses", []): source_address = clean_node(source) topology.on_change( ServerDescription( address=source_address, hello=Hello(response), round_trip_time=0 ) ) expected_results = phase["outcome"]["events"] expected_len = len(expected_results) wait_until( lambda: len(self.all_listener.results) >= expected_len, "publish all events", timeout=15, ) # Wait some time to catch possible lagging extra events. time.sleep(0.5) i = 0 while i < expected_len: result = ( self.all_listener.results[i] if len(self.all_listener.results) > i else None ) # The order of ServerOpening/ClosedEvents doesn't matter if isinstance( result, (monitoring.ServerOpeningEvent, monitoring.ServerClosedEvent) ): i, passed, message = compare_multiple_events( i, expected_results, self.all_listener.results ) self.assertTrue(passed, message) else: self.assertTrue(*compare_events(expected_results[i], result)) i += 1 # Assert no extra events. extra_events = self.all_listener.results[expected_len:] if extra_events: self.fail("Extra events %r" % (extra_events,)) self.all_listener.reset() finally: m.close() return run_scenario def create_tests(): for dirpath, _, filenames in os.walk(_TEST_PATH): for filename in filenames: with open(os.path.join(dirpath, filename)) as scenario_stream: scenario_def = json.load(scenario_stream, object_hook=object_hook) # Construct test from scenario. new_test = create_test(scenario_def) test_name = "test_%s" % (os.path.splitext(filename)[0],) new_test.__name__ = test_name setattr(TestAllScenarios, new_test.__name__, new_test) create_tests() class TestSdamMonitoring(IntegrationTest): knobs: client_knobs listener: ServerAndTopologyEventListener test_client: MongoClient coll: Collection @classmethod @client_context.require_failCommand_fail_point def setUpClass(cls): super(TestSdamMonitoring, cls).setUpClass() # Speed up the tests by decreasing the event publish frequency. cls.knobs = client_knobs(events_queue_frequency=0.1) cls.knobs.enable() cls.listener = ServerAndTopologyEventListener() retry_writes = client_context.supports_transactions() cls.test_client = rs_or_single_client( event_listeners=[cls.listener], retryWrites=retry_writes ) cls.coll = cls.test_client[cls.client.db.name].test cls.coll.insert_one({}) @classmethod def tearDownClass(cls): cls.test_client.close() cls.knobs.disable() super(TestSdamMonitoring, cls).tearDownClass() def setUp(self): self.listener.reset() def _test_app_error(self, fail_command_opts, expected_error): address = self.test_client.address # Test that an application error causes a ServerDescriptionChangedEvent # to be published. data = {"failCommands": ["insert"]} data.update(fail_command_opts) fail_insert = { "configureFailPoint": "failCommand", "mode": {"times": 1}, "data": data, } with self.fail_point(fail_insert): if self.test_client.options.retry_writes: self.coll.insert_one({}) else: with self.assertRaises(expected_error): self.coll.insert_one({}) self.coll.insert_one({}) def marked_unknown(event): return ( isinstance(event, monitoring.ServerDescriptionChangedEvent) and event.server_address == address and not event.new_description.is_server_type_known ) def discovered_node(event): return ( isinstance(event, monitoring.ServerDescriptionChangedEvent) and event.server_address == address and not event.previous_description.is_server_type_known and event.new_description.is_server_type_known ) def marked_unknown_and_rediscovered(): return ( len(self.listener.matching(marked_unknown)) >= 1 and len(self.listener.matching(discovered_node)) >= 1 ) # Topology events are published asynchronously wait_until(marked_unknown_and_rediscovered, "rediscover node") # Expect a single ServerDescriptionChangedEvent for the network error. marked_unknown_events = self.listener.matching(marked_unknown) self.assertEqual(len(marked_unknown_events), 1, marked_unknown_events) self.assertIsInstance(marked_unknown_events[0].new_description.error, expected_error) def test_network_error_publishes_events(self): self._test_app_error({"closeConnection": True}, ConnectionFailure) # In 4.4+, not primary errors from failCommand don't cause SDAM state # changes because topologyVersion is not incremented. @client_context.require_version_max(4, 3) def test_not_primary_error_publishes_events(self): self._test_app_error( {"errorCode": 10107, "closeConnection": False, "errorLabels": ["RetryableWriteError"]}, NotPrimaryError, ) def test_shutdown_error_publishes_events(self): self._test_app_error( {"errorCode": 91, "closeConnection": False, "errorLabels": ["RetryableWriteError"]}, NotPrimaryError, ) if __name__ == "__main__": unittest.main()