07/24/2025 01:55:14.759 7fac851c78d0 [contrail-database-nodemgr] [ERROR]: Cannot write http_port 8103 to /tmp/contrail-database-nodemgr.0.http_port 07/24/2025 01:55:14.759 7fac851c78d0 [contrail-database-nodemgr] [ERROR]: Starting Introspect on HTTP Port 8103 07/24/2025 01:55:14.761 7fac851c8240 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ , ] status = Down description = none to Idle on EvStart >>, ] description = Collector:Collector[none to Idle on EvStart] connection down >>, ] >> 07/24/2025 01:55:14.761 7fac851c8240 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 0 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 1 >> 07/24/2025 01:55:15.019 7fac8da55a20 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local build_info = {"build-info" : [{"build-version" : "nightly", "build-time" : "2025-07-24 00:50:54.122473", "build-user" : "root", "build-hostname" : "jenkins-build-prepare-sandbox-10063-1.novalocal", "build-id" : "nightly", "build-number" : "nightly.el7"}]} system_cpu_info = << num_socket = 1 num_cpu = 4 num_core_per_socket = 4 num_thread_per_core = 1 >> running_package_version = nightly-nightly.el7 installed_package_version = nightly-nightly.el7 >> 07/24/2025 01:55:15.022 7fac84fa1cc0 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ , ] status = Down description = none to Idle on EvStart >>, ] description = Collector:Collector[none to Idle on EvStart] connection down >>, ] >> 07/24/2025 01:55:15.022 7fac84fa1cc0 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local deleted = False process_info = [ << process_name = cassandra process_state = PROCESS_STATE_EXITED start_count = 0 stop_count = 0 exit_count = 0 last_start_time = last_stop_time = last_exit_time = core_file_list = [ ] >>, << process_name = contrail-query-engine process_state = PROCESS_STATE_EXITED start_count = 0 stop_count = 0 exit_count = 0 last_start_time = last_stop_time = last_exit_time = core_file_list = [ ] >>, << process_name = contrail-database-nodemgr process_state = PROCESS_STATE_RUNNING start_count = 1 stop_count = 0 exit_count = 0 last_start_time = 1753322113000000 last_stop_time = last_exit_time = core_file_list = [ ] >>, ] build_info = {"build-info" : [{"build-version" : "nightly", "build-time" : "2025-07-24 00:50:54.122473", "build-user" : "root", "build-hostname" : "jenkins-build-prepare-sandbox-10063-1.novalocal", "build-id" : "nightly", "build-number" : "nightly.el7"}]} >> 07/24/2025 01:55:15.216 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get database usage, will retry: cassandra 07/24/2025 01:55:15.341 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get database usage, will retry: cassandra 07/24/2025 01:55:15.488 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get database usage, will retry: cassandra 07/24/2025 01:55:15.674 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get database usage, giving up: cassandra 07/24/2025 01:55:15.831 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to connect to database by CQL and socket: cassandra 07/24/2025 01:55:15.833 7fac850ce048 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ , ] status = Down description = none to Idle on EvStart >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[none to Idle on EvStart] connection down >>, ] >> 07/24/2025 01:55:15.976 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get nodetool compactionstats: cassandra 07/24/2025 01:55:15.984 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 01:55:17.708 7fac850ce0f0 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local disk_usage_info = { /dev/vda4 : << partition_type = xfs partition_space_used_1k = 10162752 partition_space_available_1k = 72528300 percentage_partition_space_used = 12 >> } process_mem_cpu_usage = { contrail-database-nodemgr : << mem_virt = 50576 cpu_share = 0.0 mem_res = 40316 >> } system_mem_usage = << total = 16111704 used = 5496228 free = 1288088 buffers = 5136 cached = 9322252 node_type = database-node >> system_cpu_usage = << one_min_avg = 4.35 five_min_avg = 1.4 fifteen_min_avg = 0.5 cpu_share = 0 node_type = database-node >> >> 07/24/2025 01:55:18.763 7fac85023588 [contrail-database-nodemgr] [ERROR]: Session Event: TCP Connect Fail 07/24/2025 01:55:18.763 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:55:18.763 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Down description = Connect to Idle on EvTcpConnectFail >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Connect to Idle on EvTcpConnectFail] connection down >>, ] >> 07/24/2025 01:55:18.763 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 0 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = 10.0.0.48:8086 collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 2 >> 07/24/2025 01:55:22.768 7fac85023588 [contrail-database-nodemgr] [ERROR]: Session Event: TCP Connect Fail 07/24/2025 01:55:22.768 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:55:22.768 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Down description = Connect to Idle on EvTcpConnectFail >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Connect to Idle on EvTcpConnectFail] connection down >>, ] >> 07/24/2025 01:55:22.768 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 0 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = 10.0.0.48:8086 collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 2 >> 07/24/2025 01:55:26.775 7fac85023588 [contrail-database-nodemgr] [ERROR]: Session Event: TCP Connect Fail 07/24/2025 01:55:26.775 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:55:26.780 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Down description = Connect to Idle on EvTcpConnectFail >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Connect to Idle on EvTcpConnectFail] connection down >>, ] >> 07/24/2025 01:55:26.781 7fac85023588 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 0 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = 10.0.0.48:8086 collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 2 >> 07/24/2025 01:55:30.782 7fac7fc24828 [contrail-database-nodemgr] [ERROR]: Session Event: TCP Connect Fail 07/24/2025 01:55:30.782 7fac7fc24828 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:55:30.783 7fac7fc24828 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Down description = Connect to Idle on EvTcpConnectFail >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Connect to Idle on EvTcpConnectFail] connection down >>, ] >> 07/24/2025 01:55:30.783 7fac7fc24828 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 0 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = 10.0.0.48:8086 collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 2 >> 07/24/2025 01:55:31.192 7fac8824dac8 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local deleted = False process_info = [ << process_name = cassandra process_state = PROCESS_STATE_RUNNING start_count = 1 stop_count = 0 exit_count = 0 last_start_time = 1753322131191397 last_stop_time = last_exit_time = core_file_list = [ ] >>, << process_name = contrail-query-engine process_state = PROCESS_STATE_EXITED start_count = 0 stop_count = 0 exit_count = 0 last_start_time = last_stop_time = last_exit_time = core_file_list = [ ] >>, << process_name = contrail-database-nodemgr process_state = PROCESS_STATE_RUNNING start_count = 1 stop_count = 0 exit_count = 0 last_start_time = 1753322113000000 last_stop_time = last_exit_time = core_file_list = [ ] >>, ] build_info = {"build-info" : [{"build-version" : "nightly", "build-time" : "2025-07-24 00:50:54.122473", "build-user" : "root", "build-hostname" : "jenkins-build-prepare-sandbox-10063-1.novalocal", "build-id" : "nightly", "build-number" : "nightly.el7"}]} >> 07/24/2025 01:55:34.787 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: Session Event: TCP Connect Fail 07/24/2025 01:55:34.788 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:55:34.788 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Down description = Connect to Idle on EvTcpConnectFail >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Connect to Idle on EvTcpConnectFail] connection down >>, ] >> 07/24/2025 01:55:34.788 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 0 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = 10.0.0.48:8086 collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 2 >> 07/24/2025 01:55:38.798 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:55:41.118 7fac84f97f60 [contrail-database-nodemgr] [ERROR]: Session Event: TCP Connection Closed 07/24/2025 01:55:41.119 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Down description = ClientInit to Idle on EvTcpClose >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[ClientInit to Idle on EvTcpClose] connection down >>, ] >> 07/24/2025 01:55:41.119 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] SandeshModuleClientTrace: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local:Database:contrail-database-nodemgr:0 client_info = << status = Idle successful_connections = 1 pid = 1 http_port = 8103 start_time = 1753322114760854 collector_name = collector_ip = 10.0.0.48:8086 collector_list = [ 10.0.0.48:8086, ] >> sm_queue_count = 1 max_sm_queue_count = 2 >> 07/24/2025 01:55:45.126 7fac84f97c18 [contrail-database-nodemgr] [ERROR]: SANDESH: [DROP: WrongClientSMState] NodeStatusUVE: data = << name = cn-jenkins-deploy-platform-k8s-manifests-230-1.cluster.local process_status = [ << module_id = contrail-database-nodemgr instance_id = 0 state = Non-Functional connection_infos = [ << type = Collector name = Collector server_addrs = [ 10.0.0.48:8086, ] status = Initializing description = Idle to Connect on EvIdleHoldTimerExpired >>, ] description = Cassandra state detected DOWN. Disk space for DB not retrievable. Collector:Collector[Idle to Connect on EvIdleHoldTimerExpired] connection down >>, ] >> 07/24/2025 01:56:17.901 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to connect to database by CQL and socket: Result: 1 07/24/2025 01:56:23.626 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 01:57:19.056 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 01:58:18.924 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 01:59:18.872 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 02:00:19.843 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 02:01:19.074 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 02:02:19.119 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 02:03:19.253 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 02:04:19.429 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes' 07/24/2025 02:05:18.983 7fac878c9608 [contrail-database-nodemgr] [ERROR]: Failed to get core files: [Errno 2] No such file or directory: '/var/crashes'