@LaSoe: I rechecked the corrupted spool files and didn’t find any problems with them; putting them back into the spool directory also triggers their notifications.
Unfortunately, we are currently affected by a hanging site again and are still trying to figure out the root cause. It seems to be related to multisite.mk and the licensing: the Apache process is waiting to acquire a lock. The notification problem is probably a side effect of this.
One of the last things we found in web.log is this:
2024-06-16 16:55:02,388 [40] [cmk.web 2408411] Exception (kd1284, discovered_host_label_sync)
Traceback (most recent call last):
File "/omd/sites/main/lib/python3/cmk/gui/watolib/host_label_sync.py", line 229, in _execute_site_sync
raw_result = do_remote_automation(
^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 349, in do_remote_automation
serialized_response = _do_remote_automation_serialized(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 297, in _do_remote_automation_serialized
response = get_url(
^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 514, in get_url
return get_url_raw(url, insecure, auth, data, files, timeout).text
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 387, in get_url_raw
"x-checkmk-license-state": get_license_state().readable,
^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/utils/licensing/registry.py", line 73, in get_license_state
return _make_licensing_handler().state
^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/utils/licensing/registry.py", line 49, in _make_licensing_handler
return _get_licensing_handler().make()
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/utils/cee/licensing/cce_handler.py", line 882, in make
state_file_creation_time = read_creation_time(omd_root)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/utils/cee/licensing/init_state_creation.py", line 27, in read_creation_time
with locked(state_file_path):
File "/omd/sites/main/lib/python3.12/contextlib.py", line 137, in __enter__
return next(self.gen)
^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/utils/store/_locks.py", line 144, in locked
acquired = acquire_lock(path, blocking)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/utils/store/_locks.py", line 171, in acquire_lock
with _open_lock_file(path) as fd_new:
File "/omd/sites/main/lib/python3.12/contextlib.py", line 144, in __exit__
next(self.gen)
File "/omd/sites/main/lib/python3/cmk/utils/store/_locks.py", line 186, in _open_lock_file
os.close(fd)
OSError: [Errno 9] Bad file descriptor
2024-06-16 16:55:02,557 [40] [cmk.web 2408411] Exception (kd4426, discovered_host_label_sync)
Traceback (most recent call last):
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 715, in urlopen
httplib_response = self._make_request(
^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 404, in _make_request
self._validate_conn(conn)
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 1058, in _validate_conn
conn.connect()
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connection.py", line 419, in connect
self.sock = ssl_wrap_socket(
^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/util/ssl_.py", line 449, in ssl_wrap_socket
ssl_sock = _ssl_wrap_socket_impl(
^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/util/ssl_.py", line 493, in _ssl_wrap_socket_impl
return ssl_context.wrap_socket(sock, server_hostname=server_hostname)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/ssl.py", line 455, in wrap_socket
return self.sslsocket_class._create(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/ssl.py", line 960, in _create
if sock.getsockopt(SOL_SOCKET, SO_TYPE) != SOCK_STREAM:
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
OSError: [Errno 88] Socket operation on non-socket
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/omd/sites/main/lib/python3.12/site-packages/requests/adapters.py", line 486, in send
resp = conn.urlopen(
^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 799, in urlopen
retries = retries.increment(
^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/util/retry.py", line 550, in increment
raise six.reraise(type(error), error, _stacktrace)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/packages/six.py", line 769, in reraise
raise value.with_traceback(tb)
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 715, in urlopen
httplib_response = self._make_request(
^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 404, in _make_request
self._validate_conn(conn)
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connectionpool.py", line 1058, in _validate_conn
conn.connect()
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/connection.py", line 419, in connect
self.sock = ssl_wrap_socket(
^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/util/ssl_.py", line 449, in ssl_wrap_socket
ssl_sock = _ssl_wrap_socket_impl(
^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/urllib3/util/ssl_.py", line 493, in _ssl_wrap_socket_impl
return ssl_context.wrap_socket(sock, server_hostname=server_hostname)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/ssl.py", line 455, in wrap_socket
return self.sslsocket_class._create(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/ssl.py", line 960, in _create
if sock.getsockopt(SOL_SOCKET, SO_TYPE) != SOCK_STREAM:
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
urllib3.exceptions.ProtocolError: ('Connection aborted.', OSError(88, 'Socket operation on non-socket'))
During handling of the above exception, another exception occurred:
Traceback (most recent call last):
File "/omd/sites/main/lib/python3/cmk/gui/watolib/host_label_sync.py", line 229, in _execute_site_sync
raw_result = do_remote_automation(
^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 349, in do_remote_automation
serialized_response = _do_remote_automation_serialized(
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 297, in _do_remote_automation_serialized
response = get_url(
^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 514, in get_url
return get_url_raw(url, insecure, auth, data, files, timeout).text
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3/cmk/gui/watolib/automations.py", line 377, in get_url_raw
response = requests.post(
^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/requests/api.py", line 115, in post
return request("post", url, data=data, json=json, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/requests/api.py", line 59, in request
return session.request(method=method, url=url, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/requests/sessions.py", line 589, in request
resp = self.send(prep, **send_kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/requests/sessions.py", line 703, in send
r = adapter.send(request, **kwargs)
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
File "/omd/sites/main/lib/python3.12/site-packages/requests/adapters.py", line 501, in send
raise ConnectionError(err, request=request)
requests.exceptions.ConnectionError: ('Connection aborted.', OSError(88, 'Socket operation on non-socket'))
...
Is anyone else with an MSP Edition also seeing this, or does anyone have an idea what to look for? Our impression is that it got worse after we added more customers and sites.
Kind Regards
Andreas