4 # Copyright (c) 2013-2024 Wind River Systems, Inc.
6 # SPDX-License-Identifier: Apache-2.0
9 ############################################################################
11 # ALARM & CUSTOMER LOG DOCUMENTATION
13 ############################################################################
15 ############################################################################
17 # Record Format ... for documentation
20 # Type: < Alarm | Log >
21 # Description: < yaml string >
23 # [ < yaml string >, // list of yaml strings
26 # critical: < yaml string > // i.e. dictionary of yaml strings indexed by severity
27 # major: < yaml string >
28 # minor: < yaml string >
29 # warning: < yaml string >
30 # Entity_Instance_ID: < yaml string ... e.g. host=<hostname>.interface=<ifname> >
32 # [ < yaml string >, // list of yaml strings
34 # Severity: < critical | major | minor | warning >
36 # [ critical, major ] // list of severity values
37 # Proposed_Repair_Action: < yaml string > // NOTE ALARM ONLY FIELD
39 # critical: < yaml string > // i.e. dictionary of yaml strings indexed by severity
40 # major: < yaml string >
41 # minor: < yaml string >
42 # warning: < yaml string >
43 # Maintenance_Action: < yaml string > // NOTE ALARM ONLY FIELD
45 # critical: < yaml string > // i.e. dictionary of yaml strings indexed by severity
46 # major: < yaml string >
47 # minor: < yaml string >
48 # warning: < yaml string >
49 # Inhibit_Alarms: < True | False > // NOTE ALARM ONLY FIELD
50 # Alarm_Type: < operational-violation | ... >
51 # Probable_Cause: < timing-problem | ... >
53 # [ < timing-problem | ... >, // list of probable-causes
54 # < timing-problem | ... > ]
55 # Service_Affecting: < True | False >
56 # Suppression: < True | False > // NOTE ALARM ONLY FIELD
57 # Management_Affecting_Severity: < none | critical | major | minor | warning >
58 # // lowest alarm level of this type that will block forced upgrades & orchestration actions
59 # Degrade_Affecting_Severity: < none | critical | major | minor >
60 # // lowest alarm level of this type that sets a host to 'degraded'
61 # Context: < none | starlingx | openstack >
62 # // Identifies where the alarm/log is used. If it should be ignored by
63 # // the documentation generating scripts, the value has to be 'none'.
64 # // If any of the other values is used, the alarm/log will be included
65 # // in the documentation and classified by the chosen value.
69 # - use general record format above
70 # - the only dictionaries allowed are ones indexed by severity
71 # - if there are multiple lists in a record,
72 # then they should all have the same number of items, and corresponding list items together represent one instance of the alarm
73 # - if you can't describe the alarm/log based on the above rules,
74 # then you can use a multi-line string format
75 # - DELETING alarms from events.yaml: alarms should only be deleted when going to a new Titanium Cloud release
76 # - if all possible alarm severities are mgmt affecting, the convention is to
77 # use 'warning' as the Management_Affecting_Severity, even if warning is not a possible severity for that alarm
80 # - Testing of events.yaml can be done by running regular make command
81 # and specifying fm-doc:
82 # nice -n 20 ionice -c Idle make -C build fm-doc.rebuild
83 # - When building, events.yaml will be parsed for correct format, and also
84 # to ensure that Alarm IDs defined in constants.py and fmAlarm.h are
85 # listed in events.yaml
87 ############################################################################
90 #---------------------------------------------------------------------------
91 # Monitored Resource Alarms
92 #---------------------------------------------------------------------------
98 Platform CPU threshold exceeded; threshold x%, actual y% .
101 Entity_Instance_ID: host=<hostname>
102 Severity: [critical, major]
103 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
108 Alarm_Type: operational-violation
109 Probable_Cause: threshold-crossed
110 Service_Affecting: False
112 Management_Affecting_Severity: major
113 Degrade_Affecting_Severity: critical
119 VSwitch CPU threshold exceeded; threshold x%, actual y% .
123 Entity_Instance_ID: host=<hostname>
124 Severity: [critical, major, minor]
125 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
130 Alarm_Type: operational-violation
131 Probable_Cause: threshold-crossed
132 Service_Affecting: False
134 Management_Affecting_Severity: none
135 Degrade_Affecting_Severity: none
141 Memory threshold exceeded; threshold x%, actual y% .
144 Entity_Instance_ID: |-
147 host=<hostname>.memory=total
149 host=<hostname>.memory=platform
151 host=<hostname>.numa=node<number>
152 Severity: [critical, major]
153 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support; may require additional memory on Host."
158 Alarm_Type: operational-violation
159 Probable_Cause: threshold-crossed
160 Service_Affecting: False
162 Management_Affecting_Severity: none
163 Degrade_Affecting_Severity: critical
166 100.104: # NOTE This should really be split into two different Alarms.
169 host=<hostname>.filesystem=<mount-dir>
170 File System threshold exceeded; threshold x%, actual y% .
174 host=<hostname>.volumegroup=<volumegroup-name>
175 Monitor and if condition persists, consider adding additional physical volumes to the volume group.
176 Entity_Instance_ID: |-
177 host=<hostname>.filesystem=<mount-dir>
179 host=<hostname>.volumegroup=<volumegroup-name>
180 Severity: [critical, major]
181 Proposed_Repair_Action: "Reduce usage or resize filesystem."
186 Alarm_Type: operational-violation
187 Probable_Cause: threshold-crossed
188 Service_Affecting: False
190 Management_Affecting_Severity: critical
191 Degrade_Affecting_Severity: critical
197 Filesystem Alarm Condition:
198 <fs_name> filesystem is not added on both controllers and/or does not have the same size: <hostname>.
199 Entity_Instance_ID: fs_name=<image-conversion>
201 Proposed_Repair_Action: "Add image-conversion filesystem on both controllers.
202 See the |prod-long| documentation at |docs-url| for more details.
203 If problem persists, contact next level of support."
204 Maintenance_Action: degrade
206 Alarm_Type: equipment
207 Probable_Cause: configuration-or-customization-error
208 Service_Affecting: True
210 Management_Affecting_Severity: major
211 Degrade_Affecting_Severity: none
215 # 100.105: Retired (with R2 release): previously monitored /etc/nova/instances
216 # NFS mount from controller to computes
221 Description: "'OAM' Port failed."
222 Entity_Instance_ID: host=<hostname>.port=<port-name>
224 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
225 Maintenance_Action: degrade
227 Alarm_Type: operational-violation
228 Probable_Cause: unknown
229 Service_Affecting: True
231 Management_Affecting_Severity: warning
232 Degrade_Affecting_Severity: major
238 'OAM' Interface degraded.
240 'OAM' Interface failed.
241 Entity_Instance_ID: host=<hostname>.interface=<if-name>
242 Severity: [critical, major]
243 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
248 Alarm_Type: operational-violation
249 Probable_Cause: unknown
250 Service_Affecting: True
252 Management_Affecting_Severity: warning
253 Degrade_Affecting_Severity: major
258 Description: "'MGMT' Port failed."
259 Entity_Instance_ID: host=<hostname>.port=<port-name>
261 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
262 Maintenance_Action: degrade
264 Alarm_Type: operational-violation
265 Probable_Cause: unknown
266 Service_Affecting: True
268 Management_Affecting_Severity: warning
269 Degrade_Affecting_Severity: major
275 'MGMT' Interface degraded.
277 'MGMT' Interface failed.
278 Entity_Instance_ID: host=<hostname>.interface=<if-name>
279 Severity: [critical, major]
280 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
285 Alarm_Type: operational-violation
286 Probable_Cause: unknown
287 Service_Affecting: True
289 Management_Affecting_Severity: warning
290 Degrade_Affecting_Severity: major
295 Description: "'CLUSTER-HOST' Port failed."
296 Entity_Instance_ID: host=<hostname>.port=<port-name>
298 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
299 Maintenance_Action: degrade
301 Alarm_Type: operational-violation
302 Probable_Cause: unknown
303 Service_Affecting: True
305 Management_Affecting_Severity: warning
306 Degrade_Affecting_Severity: major
312 'CLUSTER-HOST' Interface degraded.
314 'CLUSTER-HOST' Interface failed.
315 Entity_Instance_ID: host=<hostname>.interface=<if-name>
316 Severity: [critical, major]
317 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
322 Alarm_Type: operational-violation
323 Probable_Cause: unknown
324 Service_Affecting: True
326 Management_Affecting_Severity: warning
327 Degrade_Affecting_Severity: major
332 Description: "'DATA-VRS' Port down."
333 Entity_Instance_ID: host=<hostname>.port=<port-name>
335 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
336 Maintenance_Action: degrade
338 Alarm_Type: operational-violation
339 Probable_Cause: unknown
340 Service_Affecting: True
342 Management_Affecting_Severity: none
343 Degrade_Affecting_Severity: major
349 'DATA-VRS' Interface degraded.
351 'DATA-VRS' Interface down.
352 Entity_Instance_ID: host=<hostname>.interface=<if-name>
353 Severity: [critical, major]
354 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
358 Alarm_Type: operational-violation
359 Probable_Cause: unknown
360 Service_Affecting: True
362 Management_Affecting_Severity: none
363 Degrade_Affecting_Severity: major
369 major: "NTP configuration does not contain any valid or reachable NTP servers."
370 minor: "NTP address <IP address> is not a valid or a reachable NTP server."
372 major: host=<hostname>.ntp
373 minor: host=<hostname>.ntp=<IP address>
374 Severity: [major, minor]
375 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
376 Maintenance_Action: none
378 Alarm_Type: communication
379 Probable_Cause: unknown
380 Service_Affecting: False
382 Management_Affecting_Severity: none
383 Degrade_Affecting_Severity: none
388 Description: "VSwitch Memory Usage, processor <processor> threshold exceeded; threshold x%, actual y% ."
389 Entity_Instance_ID: host=<hostname>.processor=<processor>
390 Severity: [critical, major, minor]
391 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
396 Alarm_Type: operational-violation
397 Probable_Cause: threshold-crossed
398 Service_Affecting: False
400 Management_Affecting_Severity: none
401 Degrade_Affecting_Severity: critical
406 Description: "Cinder LVM Thinpool Usage threshold exceeded; threshold x%, actual y% ."
407 Entity_Instance_ID: host=<hostname>
408 Severity: [critical, major, minor]
409 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
414 Alarm_Type: operational-violation
415 Probable_Cause: threshold-crossed
416 Service_Affecting: False
418 Management_Affecting_Severity: none
419 Degrade_Affecting_Severity: critical
424 Description: "Nova LVM Thinpool Usage threshold exceeded; threshold x%, actual y% ."
425 Entity_Instance_ID: host=<hostname>
426 Severity: [critical, major, minor]
427 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
432 Alarm_Type: operational-violation
433 Probable_Cause: threshold-crossed
434 Service_Affecting: False
436 Management_Affecting_Severity: major
437 Degrade_Affecting_Severity: critical
442 Description: Controller cannot establish connection with remote logging server.
443 Entity_Instance_ID: host=<hostname>
445 Proposed_Repair_Action: "Ensure Remote Log Server IP is reachable from Controller through OAM interface; otherwise contact next level of support."
446 Maintenance_Action: none
447 Inhibit_Alarms: False
448 Alarm_Type: communication
449 Probable_Cause: communication-subsystem-failure
450 Service_Affecting: False
452 Management_Affecting_Severity: none
453 Degrade_Affecting_Severity: none
459 <hostname> does not support the provisioned PTP mode
461 <hostname> PTP clocking is out-of-tolerance
463 <hostname> is not locked to remote PTP Primary source
465 <hostname> GNSS signal loss state:<state>
467 <hostname> 1PPS signal loss state:<state>
468 Entity_Instance_ID: |-
471 host=<hostname>.ptp=no-lock
473 host=<hostname>.ptp=<interface>.unsupported=hardware-timestamping
475 host=<hostname>.ptp=<interface>.unsupported=software-timestamping
477 host=<hostname>.ptp=<interface>.unsupported=legacy-timestamping
479 host=<hostname>.ptp=out-of-tolerance
481 host=<hostname>.instance=<instance>.ptp=out-of-tolerance
483 host=<hostname>.interface=<interface>.ptp=signal-loss
484 Severity: [major, minor]
485 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
486 Maintenance_Action: none
488 Alarm_Type: communication
489 Probable_Cause: unknown
490 Service_Affecting: False
492 Management_Affecting_Severity: none
493 Degrade_Affecting_Severity: none
498 Description: Controllers running mismatched kernels.
499 Entity_Instance_ID: host=<hostname>.kernel=<kernel>
501 Proposed_Repair_Action: "Modify controllers using 'system host-kernel-modify' so that both are running the desired 'standard' or 'lowlatency' kernel."
502 Maintenance_Action: none
503 Inhibit_Alarms: False
504 Alarm_Type: equipment
505 Probable_Cause: unspecified-reason
506 Service_Affecting: False
508 Management_Affecting_Severity: none
509 Degrade_Affecting_Severity: none
514 Description: Host not running the provisioned kernel.
515 Entity_Instance_ID: host=<hostname>.kernel=<kernel>
517 Proposed_Repair_Action: "Retry 'system host-kernel-modify' and if condition persists, contact next level of support."
518 Maintenance_Action: none
519 Inhibit_Alarms: False
520 Alarm_Type: equipment
521 Probable_Cause: unspecified-reason
522 Service_Affecting: False
524 Management_Affecting_Severity: major
525 Degrade_Affecting_Severity: none
531 critical: "service open file descriptor has reached its limit"
532 major: "service open file descriptor is approaching its limit"
533 Entity_Instance_ID: |-
534 host=<hostname>.resource_type=file-descriptor.service_name=<service-name>
535 Severity: [critical, major]
536 Proposed_Repair_Action: "swact to the other controller if it is available"
537 Maintenance_Action: none
539 Alarm_Type: operational-violation
540 Probable_Cause: threshold-crossed
541 Service_Affecting: True
543 Management_Affecting_Severity: critical
544 Degrade_Affecting_Severity: critical
548 #---------------------------------------------------------------------------
550 #---------------------------------------------------------------------------
555 Description: <hostname> was administratively locked to take it out-of-service.
556 Entity_Instance_ID: host=<hostname>
558 Proposed_Repair_Action: Administratively unlock Host to bring it back in-service.
559 Maintenance_Action: none
561 Alarm_Type: operational-violation
562 Probable_Cause: out-of-service
563 Service_Affecting: True
565 Management_Affecting_Severity: warning
566 Degrade_Affecting_Severity: none
571 Description: <hostname> pxeboot network communication failure.
572 Entity_Instance_ID: host=<hostname>
574 Proposed_Repair_Action: Administratively Lock and Unlock host to recover. If problem persists, contact next level of support.
575 Maintenance_Action: none
576 Inhibit_Alarms: False
577 Alarm_Type: communication
578 Probable_Cause: unknown
579 Service_Affecting: False
581 Management_Affecting_Severity: warning
582 Degrade_Affecting_Severity: none
588 <hostname> experienced a service-affecting failure.
589 Host is being auto recovered by Reboot.
590 Entity_Instance_ID: host=<hostname>
592 Proposed_Repair_Action: If auto-recovery is consistently unable to recover host to the unlocked-enabled state contact next level of support or lock and replace failing host.
593 Maintenance_Action: auto recover
594 Inhibit_Alarms: False
595 Alarm_Type: operational-violation
596 Probable_Cause: application-subsystem-failure
597 Service_Affecting: True
599 Management_Affecting_Severity: warning
600 Degrade_Affecting_Severity: none
605 Description: <hostname> experienced a configuration failure during initialization. Host is being re-configured by Reboot.
606 Entity_Instance_ID: host=<hostname>
608 Proposed_Repair_Action: If auto-recovery is consistently unable to recover host to the unlocked-enabled state contact next level of support or lock and replace failing host.
609 Maintenance_Action: auto-recover
610 Inhibit_Alarms: False
611 Alarm_Type: operational-violation
612 Probable_Cause: configuration-or-customization-error
613 Service_Affecting: True
615 Management_Affecting_Severity: warning
616 Degrade_Affecting_Severity: none
621 Description: <hostname> access to board management module has failed.
622 Entity_Instance_ID: host=<hostname>
624 Proposed_Repair_Action: Check Host's board management configuration and connectivity.
625 Maintenance_Action: auto recover
626 Inhibit_Alarms: False
627 Alarm_Type: operational-violation
628 Probable_Cause: communication-subsystem-failure
629 Service_Affecting: False
631 Management_Affecting_Severity: none
632 Degrade_Affecting_Severity: none
637 Description: <hostname> compute service of the only available controller is not operational. Auto-recovery is disabled. Degrading host instead.
638 Entity_Instance_ID: host=<hostname>
640 Proposed_Repair_Action: Enable second controller and Switch Activity (Swact) over to it as soon as possible. Then Lock and Unlock host to recover its local compute service.
641 Maintenance_Action: "degrade - requires manual action"
642 Inhibit_Alarms: False
643 Alarm_Type: operational-violation
644 Probable_Cause: communication-subsystem-failure
645 Service_Affecting: True
647 Management_Affecting_Severity: warning
648 Degrade_Affecting_Severity: major
655 <hostname> is experiencing an intermittent 'Management Network' communication failure that has exceeded its lower alarming threshold.
658 <hostname> is experiencing a persistent critical 'Management Network' communication failure."
659 Entity_Instance_ID: host=<hostname>
660 Severity: [critical, major]
661 Proposed_Repair_Action: "Check 'Management Network' connectivity and support for multicast messaging. If problem consistently occurs after that and Host is reset, then contact next level of support or lock and replace failing host."
662 Maintenance_Action: auto recover
663 Inhibit_Alarms: False
664 Alarm_Type: communication
665 Probable_Cause: unknown
666 Service_Affecting: True
668 Management_Affecting_Severity: warning
669 Degrade_Affecting_Severity: none
676 <hostname> is experiencing an intermittent 'Cluster-host Network' communication failure that has exceeded its lower alarming threshold.
679 <hostname> is experiencing a persistent critical 'Cluster-host Network' communication failure."
680 Entity_Instance_ID: host=<hostname>
681 Severity: [critical, major]
682 Proposed_Repair_Action: "Check 'Cluster-host Network' connectivity and support for multicast messaging. If problem consistently occurs after that and Host is reset, then contact next level of support or lock and replace failing host."
683 Maintenance_Action: auto recover
684 Inhibit_Alarms: False
685 Alarm_Type: communication
686 Probable_Cause: unknown
687 Service_Affecting: True
689 Management_Affecting_Severity: warning
690 Degrade_Affecting_Severity: none
697 Main Process Monitor Daemon Failure (major):
698 <hostname> 'Process Monitor' (pmond) process is not running or functioning properly. The system is trying to recover this process.
700 Monitored Process Failure (critical/major/minor):
701 Critical: <hostname> critical '<processname>' process has failed and could not be auto-recovered gracefully.
702 Auto-recovery progression by host reboot is required and in progress.
703 Major: <hostname> is degraded due to the failure of its '<processname>' process. Auto recovery of this major process is in progress.
704 Minor: <hostname> '<processname>' process has failed. Auto recovery of this minor process is in progress.
706 <hostname> '<processname>' process has failed. Manual recovery is required.
707 Entity_Instance_ID: host=<hostname>.process=<processname>
708 Severity: [critical, major, minor]
709 Proposed_Repair_Action: |-
710 If this alarm does not automatically clear after some time and continues to be asserted after Host is locked and unlocked then contact next level of support for root cause analysis and recovery.
712 If problem consistently occurs after Host is locked and unlocked then contact next level of support for root cause analysis and recovery.
714 critical: auto-recover
717 Inhibit_Alarms: False
718 Alarm_Type: operational-violation
719 Probable_Cause: unknown
725 Management_Affecting_Severity: warning
726 Degrade_Affecting_Severity: major
729 # 200.006: // NOTE using duplicate ID of a completely analogous Alarm for this
732 # Main Process Monitor Daemon Failure (major)
733 # <hostname> 'Process Monitor' (pmond) process is not running or functioning properly.
734 # The system is trying to recover this process.
736 # Monitored Process Failure (critical/major/minor)
737 # critical: <hostname> critical '<processname>' process has failed and could not be auto-recovered gracefully.
738 # Auto-recovery progression by host reboot is required and in progress.
739 # major: <hostname> is degraded due to the failure of its '<processname>' process. Auto recovery of this major process is in progress.
740 # minor: <hostname> '<processname>' process has failed. Auto recovery of this minor process is in progress.
742 # <hostname> '<processname>' process has failed. Manual recovery is required.
743 # Entity_Instance_ID: host=<hostname>.process=<process-name>
746 # Probable_Cause: unspecified-reason
747 # Service_Affecting: True
753 critical: "Host is degraded due to a 'critical' out-of-tolerance reading from the '<sensorname>' sensor"
754 major: "Host is degraded due to a 'major' out-of-tolerance reading from the '<sensorname>' sensor"
755 minor: "Host is reporting a 'minor' out-of-tolerance reading from the '<sensorname>' sensor"
756 Entity_Instance_ID: host=<hostname>.sensor=<sensorname>
757 Severity: [critical, major, minor]
758 Proposed_Repair_Action: "If problem consistently occurs after Host is power cycled and or reset, contact next level of support or lock and replace failing host."
762 minor: auto-recover (polling)
764 Alarm_Type: operational-violation
765 Probable_Cause: unspecified-reason
771 Management_Affecting_Severity: none
772 Degrade_Affecting_Severity: critical
777 Description: The Hardware Monitor was unable to load, configure and monitor one or more hardware sensors.
778 Entity_Instance_ID: host=<hostname>
780 Proposed_Repair_Action: Check Board Management Controller provisioning. Try reprovisioning the BMC. If problem persists, try power cycling the host and then the entire server including the BMC power. If problem persists, then contact next level of support.
781 Maintenance_Action: None
782 Inhibit_Alarms: False
783 Alarm_Type: operational-violation
784 Probable_Cause: unknown
785 Service_Affecting: False
787 Management_Affecting_Severity: none
788 Degrade_Affecting_Severity: none
793 Description: Unable to read one or more sensor groups from this host's board management controller
794 Entity_Instance_ID: host=<hostname>
796 Proposed_Repair_Action: Check board management connectivity and try rebooting the board management controller. If problem persists, contact next level of support or lock and replace failing host.
797 Maintenance_Action: None
798 Inhibit_Alarms: False
799 Alarm_Type: operational-violation
800 Probable_Cause: unknown
801 Service_Affecting: False
803 Management_Affecting_Severity: none
804 Degrade_Affecting_Severity: none
809 Description: Issue in creation or unsealing of LUKS volume
810 Entity_Instance_ID: host=<hostname>
812 Proposed_Repair_Action: If auto-recovery is consistently unable to recover host to the unlocked-enabled state contact next level of support or lock and replace failing host.
813 Maintenance_Action: None
814 Inhibit_Alarms: False
815 Alarm_Type: operational-violation
816 Probable_Cause: unknown
817 Service_Affecting: False
819 Management_Affecting_Severity: major
820 Degrade_Affecting_Severity: none
826 <hostname> has been 'discovered' on the network
828 <hostname> has been 'added' to the system
830 <hostname> has 'entered' multi-node failure avoidance
832 <hostname> has 'exited' multi-node failure avoidance
834 host=<hostname>.event=discovered
836 host=<hostname>.event=add
838 host=<hostname>.event=mnfa_enter
840 host=<hostname>.event=mnfa_exit
843 Probable_Cause: unspecified-reason
844 Service_Affecting: True
851 <hostname> board management controller has been 'provisioned'
853 <hostname> board management controller has been 're-provisioned'
855 <hostname> board management controller has been 'de-provisioned'
857 <hostname> manual 'unlock' request
859 <hostname> manual 'reboot' request
861 <hostname> manual 'reset' request
863 <hostname> manual 'power-off' request
865 <hostname> manual 'power-on' request
867 <hostname> manual 'reinstall' request
869 <hostname> manual 'force-lock' request
871 <hostname> manual 'delete' request
873 <hostname> manual 'controller switchover' request
874 Entity_Instance_ID: |-
875 host=<hostname>.command=provision
877 host=<hostname>.command=reprovision
879 host=<hostname>.command=deprovision
881 host=<hostname>.command=unlock
883 host=<hostname>.command=reboot
885 host=<hostname>.command=reset
887 host=<hostname>.command=power-off
889 host=<hostname>.command=power-on
891 host=<hostname>.command=reinstall
893 host=<hostname>.command=force-lock
895 host=<hostname>.command=delete
897 host=<hostname>.command=swact
900 Probable_Cause: unspecified-reason
901 Service_Affecting: False
908 <hostname> is now 'disabled'
910 <hostname> is now 'enabled'
912 <hostname> is now 'online'
914 <hostname> is now 'offline'
916 <hostname> is 'disabled-failed' to the system
918 <hostname> reinstall failed
920 <hostname> reinstall completed successfully
921 Entity_Instance_ID: |-
922 host=<hostname>.state=disabled
924 host=<hostname>.state=enabled
926 host=<hostname>.status=online
928 host=<hostname>.status=offline
930 host=<hostname>.status=failed
932 host=<hostname>.status=reinstall-failed
934 host=<hostname>.status=reinstall-complete
937 Probable_Cause: unspecified-reason
938 Service_Affecting: True
942 #---------------------------------------------------------------------------
944 #---------------------------------------------------------------------------
948 Description: System Backup in progress.
949 Entity_Instance_ID: host=controller
951 Proposed_Repair_Action: No action required.
954 Alarm_Type: operational-violation
955 Probable_Cause: unspecified-reason
956 Service_Affecting: False
958 Management_Affecting_Severity: warning
959 Degrade_Affecting_Severity: none
964 Description: System Restore in progress.
965 Entity_Instance_ID: host=controller
967 Proposed_Repair_Action: Run 'system restore-complete' to complete restore if running restore manually.
970 Alarm_Type: operational-violation
971 Probable_Cause: unspecified-reason
972 Service_Affecting: False
974 Management_Affecting_Severity: warning
975 Degrade_Affecting_Severity: none
979 #---------------------------------------------------------------------------
980 # SYSTEM CONFIGURATION
981 #---------------------------------------------------------------------------
985 Description: <hostname> Configuration is out-of-date.
986 Entity_Instance_ID: host=<hostname>
988 Proposed_Repair_Action: Administratively lock and unlock <hostname> to update config.
991 Alarm_Type: operational-violation
992 Probable_Cause: unspecified-reason
993 Service_Affecting: True
995 Management_Affecting_Severity: warning
996 Degrade_Affecting_Severity: none
1002 Description: "Kubernetes certificates rotation failed on host[, reason = <reason_text>]"
1003 Entity_Instance_ID: host=<hostname>
1005 Proposed_Repair_Action: Lock and unlock the host to update services with new certificates (Manually renew kubernetes certificates first if renewal failed).
1008 Alarm_Type: operational-violation
1009 Probable_Cause: unspecified-reason
1010 Service_Affecting: False
1012 Management_Affecting_Severity: warning
1013 Degrade_Affecting_Severity: none
1018 Description: "IPsec certificates renewal failed on host[, reason = <reason_text>]"
1019 Entity_Instance_ID: host=<hostname>
1021 Proposed_Repair_Action: Check cron.log and ipsec-auth.log, fix the issue and rerun the renewal cron job.
1024 Alarm_Type: operational-violation
1025 Probable_Cause: unspecified-reason
1026 Service_Affecting: False
1028 Management_Affecting_Severity: warning
1029 Degrade_Affecting_Severity: none
1032 #---------------------------------------------------------------------------
1034 #---------------------------------------------------------------------------
1037 Description: "Deployment resource not reconciled: <name>"
1038 Entity_Instance_ID: resource=<crd-resource>,name=<resource-name>
1040 Proposed_Repair_Action: Monitor and if condition persists, validate deployment configuration.
1043 Alarm_Type: operational-violation
1044 Probable_Cause: configuration-out-of-date
1045 Service_Affecting: True
1047 Management_Affecting_Severity: warning
1048 Degrade_Affecting_Severity: none
1053 Description: "Deployment resource not synchronized: <name>"
1054 Entity_Instance_ID: resource=<crd-resource>,name=<resource-name>
1056 Proposed_Repair_Action: Monitor and if condition persists, validate deployment configuration.
1059 Alarm_Type: operational-violation
1060 Probable_Cause: configuration-out-of-date
1061 Service_Affecting: False
1063 Management_Affecting_Severity: none
1064 Degrade_Affecting_Severity: none
1067 #---------------------------------------------------------------------------
1068 # VM Compute Services
1069 #---------------------------------------------------------------------------
1072 Description: "Host <host_name> compute services failure[, reason = <reason_text>]"
1073 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1075 Alarm_Type: equipment
1076 Probable_Cause: unspecified-reason
1077 Service_Affecting: False
1082 Description: Host <host_name> compute services enabled
1083 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1085 Alarm_Type: equipment
1086 Probable_Cause: unspecified-reason
1087 Service_Affecting: False
1092 Description: Host <host_name> compute services disabled
1093 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1095 Alarm_Type: equipment
1096 Probable_Cause: unspecified-reason
1097 Service_Affecting: False
1103 Description: Host <host_name> hypervisor is now <administrative_state>-<operational_state>
1104 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1106 Alarm_Type: equipment
1107 Probable_Cause: unspecified-reason
1108 Service_Affecting: False
1112 #---------------------------------------------------------------------------
1114 #---------------------------------------------------------------------------
1118 Description: <subcloud> is offline
1119 Entity_Instance_ID: subcloud=<subcloud>
1121 Proposed_Repair_Action: Wait for subcloud to become online; if problem persists contact next level of support
1124 Alarm_Type: communication
1125 Probable_Cause: loss-of-signal
1126 Service_Affecting: False
1128 Management_Affecting_Severity: none
1129 Degrade_Affecting_Severity: none
1134 Description: <subcloud> <resource> sync_status is out-of-sync
1135 Entity_Instance_ID: [subcloud=<subcloud>.resource=<compute | network | platform | volumev2>]
1137 Proposed_Repair_Action: If problem persists contact next level of support
1141 Probable_Cause: application-subsystem-failure
1142 Service_Affecting: False
1144 Management_Affecting_Severity: none
1145 Degrade_Affecting_Severity: none
1150 Description: Subcloud backup failure
1151 Entity_Instance_ID: subcloud=<subcloud>
1153 Proposed_Repair_Action: Retry subcloud backup after checking backup input file. If problem persists, contact next level of support.
1156 Alarm_Type: processing-error
1157 Probable_Cause: unknown
1158 Service_Affecting: False
1160 Management_Affecting_Severity: none
1161 Degrade_Affecting_Severity: none
1167 Critical: Peer <peer_uuid> is in disconnected state. The following subcloud peer groups are impacted: <peer-groups>.
1168 Major: Peer <peer_uuid> connections in disconnected state.
1169 Entity_Instance_ID: |-
1171 Severity: [critical, major]
1172 Proposed_Repair_Action: "Check the connectivity between the current system and the reported peer site. If the peer system is down, migrate the affected peer group(s) to the current system for continued subcloud management."
1175 Alarm_Type: communication
1176 Probable_Cause: unknown
1177 Service_Affecting: False
1179 Management_Affecting_Severity: none
1180 Degrade_Affecting_Severity: none
1186 Subcloud peer group <peer_group_name> is managed by remote system <peer_uuid> with a lower priority.
1187 Entity_Instance_ID: peer_group=<peer_group_name>,peer=<peer_uuid>
1189 Proposed_Repair_Action: "Check the reported peer group state. Migrate it back to the current system if the state is 'rehomed' and the current system is stable. Otherwise, wait until these conditions are met."
1191 Inhibit_Alarms: False
1193 Probable_Cause: unknown
1194 Service_Affecting: False
1196 Management_Affecting_Severity: none
1197 Degrade_Affecting_Severity: none
1200 #---------------------------------------------------------------------------
1202 #---------------------------------------------------------------------------
1206 Description: "'Data' Port failed."
1207 Entity_Instance_ID: host=<hostname>.port=<port-uuid>
1209 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1212 Alarm_Type: equipment
1213 Probable_Cause: loss-of-signal
1214 Service_Affecting: True
1216 Management_Affecting_Severity: warning
1217 Degrade_Affecting_Severity: none
1224 'Data' Interface degraded.
1226 'Data' Interface failed.
1227 Entity_Instance_ID: host=<hostname>.interface=<if-uuid>
1228 Severity: [critical, major]
1229 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1232 Alarm_Type: equipment
1233 Probable_Cause: loss-of-signal
1234 Service_Affecting: True
1236 Management_Affecting_Severity: warning
1237 Degrade_Affecting_Severity: critical
1243 Description: Networking Agent not responding.
1244 Entity_Instance_ID: host=<hostname>.agent=<agent-uuid>
1246 Proposed_Repair_Action: "If condition persists, attempt to clear issue by administratively locking and unlocking the Host."
1249 Alarm_Type: operational-violation
1250 Probable_Cause: underlying-resource-unavailable
1251 Service_Affecting: True
1253 Management_Affecting_Severity: warning
1254 Degrade_Affecting_Severity: none
1260 Description: No enabled compute host with connectivity to provider network.
1261 Entity_Instance_ID: service=networking.providernet=<pnet-uuid>
1263 Proposed_Repair_Action: Enable compute hosts with required provider network connectivity.
1266 Alarm_Type: operational-violation
1267 Probable_Cause: underlying-resource-unavailable
1268 Service_Affecting: True
1270 Management_Affecting_Severity: warning
1271 Degrade_Affecting_Severity: none
1278 Communication failure detected over provider network x% for ranges y% on host z%.
1280 Communication failure detected over provider network x% on host z%.
1281 Entity_Instance_ID: host=<hostname>.service=networking.providernet=<pnet-uuid>
1283 Proposed_Repair_Action: Check neighbor switch port VLAN assignments.
1286 Alarm_Type: operational-violation
1287 Probable_Cause: underlying-resource-unavailable
1288 Service_Affecting: True
1290 Management_Affecting_Severity: warning
1291 Degrade_Affecting_Severity: none
1298 ML2 Driver Agent non-reachable
1300 ML2 Driver Agent reachable but non-responsive
1302 ML2 Driver Agent authentication failure
1304 ML2 Driver Agent is unable to sync Neutron database
1305 Entity_Instance_ID: host=<hostname>.ml2driver=<driver>
1307 Proposed_Repair_Action: "Monitor and if condition persists, contact next level of support."
1310 Alarm_Type: processing-error
1311 Probable_Cause: underlying-resource-unavailable
1312 Service_Affecting: True
1314 Management_Affecting_Severity: warning
1315 Degrade_Affecting_Severity: none
1321 Description: "Openflow Controller connection failed."
1322 Entity_Instance_ID: host=<hostname>.openflow-controller=<uri>
1324 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1327 Alarm_Type: equipment
1328 Probable_Cause: loss-of-signal
1329 Service_Affecting: True
1331 Management_Affecting_Severity: warning
1332 Degrade_Affecting_Severity: critical
1339 No active Openflow controller connections found for this network.
1341 One or more Openflow controller connections in disconnected state for this network.
1342 Entity_Instance_ID: host=<hostname>.openflow-network=<name>
1343 Severity: [critical, major]
1344 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1347 Alarm_Type: equipment
1348 Probable_Cause: loss-of-signal
1349 Service_Affecting: True
1351 Management_Affecting_Severity: warning
1352 Degrade_Affecting_Severity: critical
1358 Description: "OVSDB Manager connection failed."
1359 Entity_Instance_ID: host=<hostname>.sdn-controller=<uuid>
1361 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1364 Alarm_Type: equipment
1365 Probable_Cause: loss-of-signal
1366 Service_Affecting: True
1368 Management_Affecting_Severity: warning
1369 Degrade_Affecting_Severity: critical
1375 Description: "No active OVSDB connections found."
1376 Entity_Instance_ID: host=<hostname>
1378 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1381 Alarm_Type: equipment
1382 Probable_Cause: loss-of-signal
1383 Service_Affecting: True
1385 Management_Affecting_Severity: warning
1386 Degrade_Affecting_Severity: critical
1391 Description: "Dynamic routing agent x% lost connectivity to peer y%."
1392 Entity_Instance_ID: host=<hostname>,agent=<agent-uuid>,bgp-peer=<bgp-peer>
1394 Proposed_Repair_Action: If condition persists, fix connectivity to peer.
1397 Alarm_Type: operational-violation
1398 Probable_Cause: loss-of-signal
1399 Service_Affecting: True
1401 Management_Affecting_Severity: warning
1402 Degrade_Affecting_Severity: none
1406 #---------------------------------------------------------------------------
1408 #---------------------------------------------------------------------------
1413 Service group failure; <list of affected services>.
1415 Service group degraded; <list of affected services>.
1417 Service group warning; <list of affected services>.
1418 Entity_Instance_ID: service_domain=<domain_name>.service_group=<group_name>.host=<hostname>
1419 Severity: [critical, major, minor]
1420 Proposed_Repair_Action: Contact next level of support.
1422 Inhibit_Alarms: False
1423 Alarm_Type: processing-error
1424 Probable_Cause: underlying-resource-unavailable
1425 Service_Affecting: True
1427 Management_Affecting_Severity: warning
1428 Degrade_Affecting_Severity: major
1435 Service group loss of redundancy; expected <num> standby member<s> but no standby members available.
1437 Service group loss of redundancy; expected <num> standby member<s> but only <num> standby member<s> available.
1439 Service group loss of redundancy; expected <num> active member<s> but no active members available.
1441 Service group loss of redundancy; expected <num> active member<s> but only <num> active member<s> available.
1442 Entity_Instance_ID: service_domain=<domain_name>.service_group=<group_name>
1444 Proposed_Repair_Action: "Bring a controller node back into service, otherwise contact next level of support."
1446 Inhibit_Alarms: False
1447 Alarm_Type: processing-error
1448 Probable_Cause: underlying-resource-unavailable
1449 Service_Affecting: True
1451 Management_Affecting_Severity: warning
1452 Degrade_Affecting_Severity: none
1459 License key is not installed; a valid license key is required for operation.
1461 License key has expired or is invalid; a valid license key is required for operation.
1463 Evaluation license key will expire on <date>; there are <num_days> days remaining in this evaluation.
1465 Evaluation license key will expire on <date>; there is only 1 day remaining in this evaluation.
1466 Entity_Instance_ID: host=<hostname>
1468 Proposed_Repair_Action: Contact next level of support to obtain a new license key.
1470 Inhibit_Alarms: False
1471 Alarm_Type: processing-error
1472 Probable_Cause: key-expired
1473 Service_Affecting: True
1475 Management_Affecting_Severity: critical
1476 Degrade_Affecting_Severity: none
1480 # 400.004: // NOTE Removed
1482 # Description: Service group software modification detected; <list of affected files>.
1483 # Entity_Instance_ID: host=<hostname>
1485 # Proposed_Repair_Action: Contact next level of support.
1486 # Maintenance_Action:
1487 # Inhibit_Alarms: False
1488 # Alarm_Type: processing-error
1489 # Probable_Cause: software-program-error
1490 # Service_Affecting: True
1491 # Suppression: False
1497 Communication failure detected with peer over port <linux-ifname>.
1499 Communication failure detected with peer over port <linux-ifname> within the last 30 seconds.
1500 Entity_Instance_ID: host=<hostname>.network=<mgmt | oam | cluster-host>
1502 Proposed_Repair_Action: Check cabling and far-end port configuration and status on adjacent equipment.
1504 Inhibit_Alarms: False
1505 Alarm_Type: communication
1506 Probable_Cause: underlying-resource-unavailable
1507 Service_Affecting: True
1509 Management_Affecting_Severity: warning
1510 Degrade_Affecting_Severity: none
1514 #---------------------------------------------------------------------------
1516 #---------------------------------------------------------------------------
1520 Description: Service group <group> state change from <state> to <state> on host <host_name>
1521 Entity_Instance_ID: service_domain=<domain>.service_group=<group>.host=<host_name>
1523 Alarm_Type: processing-error
1524 Probable_Cause: unspecified-reason
1525 Service_Affecting: True
1531 Service group <group> loss of redundancy; expected <X> standby member but no standby members available
1533 Service group <group> loss of redundancy; expected <X> standby member but only <Y> standby member(s) available
1535 Service group <group> has no active members available; expected <X> active member(s)
1537 Service group <group> loss of redundancy; expected <X> active member(s) but only <Y> active member(s) available
1538 Entity_Instance_ID: service_domain=<domain>.service_group=<group>
1540 Alarm_Type: processing-error
1541 Probable_Cause: unspecified-reason
1542 Service_Affecting: True
1548 License key has expired or is invalid
1550 Evaluation license key will expire on <date>
1552 License key is valid
1553 Entity_Instance_ID: host=<host_name>
1555 Alarm_Type: processing-error
1556 Probable_Cause: unspecified-reason
1557 Service_Affecting: True
1563 Communication failure detected with peer over port <port> on host <host_name>
1565 Communication failure detected with peer over port <port> on host <host_name> within the last <X> seconds
1567 Communication established with peer over port <port> on host <host_name>
1568 Entity_Instance_ID: host=<host_name>.network=<network>
1570 Alarm_Type: processing-error
1571 Probable_Cause: unspecified-reason
1572 Service_Affecting: True
1577 Description: Swact or swact-force
1578 Entity_Instance_ID: host=<host_name>
1580 Alarm_Type: processing-error
1581 Probable_Cause: unspecified-reason
1582 Service_Affecting: True
1586 #---------------------------------------------------------------------------
1588 #---------------------------------------------------------------------------
1592 Description: TPM initialization failed on host.
1593 Entity_Instance_ID: host=<hostname>
1595 Proposed_Repair_Action: Reinstall HTTPS certificate; if problem persists contact next level of support.
1596 Maintenance_Action: degrade
1598 Alarm_Type: equipment
1599 Probable_Cause: procedural-error
1600 Service_Affecting: True
1602 Management_Affecting_Severity: none
1603 Degrade_Affecting_Severity: none
1608 Description: Developer patch certificate enabled.
1609 Entity_Instance_ID: host=controller
1611 Proposed_Repair_Action: Reinstall system to disable developer certificate and remove untrusted patches.
1614 Alarm_Type: operational-violation
1615 Probable_Cause: unspecified-reason
1616 Service_Affecting: False
1618 Management_Affecting_Severity: none
1619 Degrade_Affecting_Severity: none
1625 Certificate 'system certificate-show <uuid>' (mode=<ssl/ssl_ca/docker_registry/openstack/openstack_ca>) expiring soon on <date>.
1627 Certificate '<Namespace>/<Certificate/Secret>' expiring soon on <date>.
1629 Certificate '<k8sRootCA/EtcdCA>' expiring soon on <date>.
1630 Entity_Instance_ID: |-
1631 system.certificate.mode=<mode>.uuid=<uuid>
1633 namespace=<namespace-name>.certificate=<certificate-name>
1635 namespace=<namespace-name>.secret=<secret-name>
1637 system.certificate.k8sRootCA
1639 Proposed_Repair_Action: Check certificate expiration time. Renew certificate for the entity identified.
1642 Alarm_Type: operational-violation
1643 Probable_Cause: certificate-expiration
1644 Service_Affecting: False
1646 Management_Affecting_Severity: none
1647 Degrade_Affecting_Severity: none
1653 Certificate 'system certificate-show <uuid>' (mode=<ssl/ssl_ca/docker_registry/openstack/openstack_ca>) expired.
1655 Certificate '<Namespace>/<Certificate/Secret>' expired.
1657 Certificate '<k8sRootCA/EtcdRootCA>' expired.
1658 Entity_Instance_ID: |-
1659 system.certificate.mode=<mode>.uuid=<uuid>
1661 namespace=<namespace-name>.certificate=<certificate-name>
1663 namespace=<namespace-name>.secret=<secret-name>
1665 system.certificate.k8sRootCA
1667 Proposed_Repair_Action: Check certificate expiration time. Renew certificate for the entity identified.
1670 Alarm_Type: operational-violation
1671 Probable_Cause: certificate-expiration
1672 Service_Affecting: False
1674 Management_Affecting_Severity: none
1675 Degrade_Affecting_Severity: none
1680 Description: "Host <host_name> has IMA Appraisal failure for service <service> when executing <file>[, reason = <reason_text>]"
1681 Entity_Instance_ID: host=<hostname>.service=<service>
1683 Alarm_Type: integrity-violation
1684 Probable_Cause: information-modification-detected
1685 Service_Affecting: False
1689 #---------------------------------------------------------------------------
1691 #---------------------------------------------------------------------------
1696 Instance <instance_name> owned by <tenant_name> has failed on host <host_name>
1697 Instance <instance_name> owned by <tenant_name> has failed to schedule
1698 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1700 Proposed_Repair_Action: The system will attempt recovery; no repair action required
1703 Alarm_Type: processing-error
1704 Probable_Cause: software-error
1705 Service_Affecting: True
1707 Management_Affecting_Severity: warning
1708 Degrade_Affecting_Severity: none
1713 Description: Instance <instance_name> owned by <tenant_name> is paused on host <host_name>
1714 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1716 Proposed_Repair_Action: Un-pause the instance
1719 Alarm_Type: processing-error
1720 Probable_Cause: procedural-error
1721 Service_Affecting: True
1723 Management_Affecting_Severity: warning
1724 Degrade_Affecting_Severity: none
1729 Description: Instance <instance_name> owned by <tenant_name> is suspended on host <host_name>
1730 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1732 Proposed_Repair_Action: Resume the instance
1735 Alarm_Type: processing-error
1736 Probable_Cause: procedural-error
1737 Service_Affecting: True
1739 Management_Affecting_Severity: warning
1740 Degrade_Affecting_Severity: none
1745 Description: Instance <instance_name> owned by <tenant_name> is stopped on host <host_name>
1746 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1748 Proposed_Repair_Action: Start the instance
1751 Alarm_Type: processing-error
1752 Probable_Cause: procedural-error
1753 Service_Affecting: True
1755 Management_Affecting_Severity: warning
1756 Degrade_Affecting_Severity: none
1761 Description: Instance <instance_name> owned by <tenant_name> is rebooting on host <host_name>
1762 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1764 Proposed_Repair_Action: Wait for reboot to complete; if problem persists contact next level of support
1767 Alarm_Type: processing-error
1768 Probable_Cause: unspecified-reason
1769 Service_Affecting: True
1771 Management_Affecting_Severity: warning
1772 Degrade_Affecting_Severity: none
1777 Description: Instance <instance_name> owned by <tenant_name> is rebuilding on host <host_name>
1778 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1780 Proposed_Repair_Action: Wait for rebuild to complete; if problem persists contact next level of support
1783 Alarm_Type: processing-error
1784 Probable_Cause: underlying-resource-unavailable
1785 Service_Affecting: True
1787 Management_Affecting_Severity: warning
1788 Degrade_Affecting_Severity: none
1793 Description: Instance <instance_name> owned by <tenant_name> is evacuating from host <host_name>
1794 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1796 Proposed_Repair_Action: Wait for evacuate to complete; if problem persists contact next level of support
1799 Alarm_Type: processing-error
1800 Probable_Cause: underlying-resource-unavailable
1801 Service_Affecting: True
1803 Management_Affecting_Severity: warning
1804 Degrade_Affecting_Severity: none
1809 Description: Instance <instance_name> owned by <tenant_name> is live migrating from host <host_name>
1810 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1812 Proposed_Repair_Action: Wait for live migration to complete; if problem persists contact next level of support
1815 Alarm_Type: processing-error
1816 Probable_Cause: unspecified-reason
1817 Service_Affecting: True
1819 Management_Affecting_Severity: warning
1820 Degrade_Affecting_Severity: none
1825 Description: Instance <instance_name> owned by <tenant_name> is cold migrating from host <host_name>
1826 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1828 Proposed_Repair_Action: Wait for cold migration to complete; if problem persists contact next level of support
1831 Alarm_Type: processing-error
1832 Probable_Cause: unspecified-reason
1833 Service_Affecting: True
1835 Management_Affecting_Severity: warning
1836 Degrade_Affecting_Severity: none
1841 Description: Instance <instance_name> owned by <tenant_name> has been cold-migrated to host <host_name> waiting for confirmation
1842 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1844 Proposed_Repair_Action: Confirm or revert cold-migrate of instance
1847 Alarm_Type: processing-error
1848 Probable_Cause: unspecified-reason
1849 Service_Affecting: True
1851 Management_Affecting_Severity: warning
1852 Degrade_Affecting_Severity: none
1857 Description: Instance <instance_name> owned by <tenant_name> is reverting cold migrate to host <host_name>
1858 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1860 Proposed_Repair_Action: "Wait for cold migration revert to complete; if problem persists contact next level of support"
1864 Probable_Cause: unspecified-reason
1865 Service_Affecting: True
1867 Management_Affecting_Severity: warning
1868 Degrade_Affecting_Severity: none
1873 Description: Instance <instance_name> owned by <tenant_name> is resizing on host <host_name>
1874 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1876 Proposed_Repair_Action: Wait for resize to complete; if problem persists contact next level of support
1879 Alarm_Type: processing-error
1880 Probable_Cause: unspecified-reason
1881 Service_Affecting: True
1883 Management_Affecting_Severity: warning
1884 Degrade_Affecting_Severity: none
1889 Description: Instance <instance_name> owned by <tenant_name> has been resized on host <host_name> waiting for confirmation
1890 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1892 Proposed_Repair_Action: Confirm or revert resize of instance
1895 Alarm_Type: processing-error
1896 Probable_Cause: unspecified-reason
1897 Service_Affecting: True
1899 Management_Affecting_Severity: warning
1900 Degrade_Affecting_Severity: none
1905 Description: Instance <instance_name> owned by <tenant_name> is reverting resize on host <host_name>
1906 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1908 Proposed_Repair_Action: "Wait for resize revert to complete; if problem persists contact next level of support"
1912 Probable_Cause: unspecified-reason
1913 Service_Affecting: True
1915 Management_Affecting_Severity: warning
1916 Degrade_Affecting_Severity: none
1921 Description: Guest Heartbeat not established for instance <instance_name> owned by <tenant_name> on host <host_name>
1922 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1924 Proposed_Repair_Action: "Verify that the instance is running the Guest-Client daemon, or disable Guest Heartbeat for the instance if no longer needed, otherwise contact next level of support"
1927 Alarm_Type: communication
1928 Probable_Cause: procedural-error
1929 Service_Affecting: True
1931 Management_Affecting_Severity: warning
1932 Degrade_Affecting_Severity: none
1937 Description: Multi-Node Recovery Mode
1938 Entity_Instance_ID: subsystem=vim
1940 Proposed_Repair_Action: "Wait for the system to exit out of this mode"
1943 Alarm_Type: equipment
1944 Probable_Cause: unspecified-reason
1945 Service_Affecting: True
1947 Management_Affecting_Severity: warning
1948 Degrade_Affecting_Severity: none
1953 Description: Server group <server_group_name> <policy> policy was not satisfied
1954 Entity_Instance_ID: server-group=<server-group-uuid>
1956 Proposed_Repair_Action: "Migrate instances in an attempt to satisfy the policy; if problem persists contact next level of support"
1959 Alarm_Type: processing-error
1960 Probable_Cause: procedural-error
1961 Service_Affecting: True
1963 Management_Affecting_Severity: none
1964 Degrade_Affecting_Severity: none
1970 Description: Instance <instance_name> is enabled on host <host_name>
1971 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1973 Alarm_Type: equipment
1974 Probable_Cause: unspecified-reason
1975 Service_Affecting: False
1980 Description: Instance <instance_name> owned by <tenant_name> has failed[, reason = <reason_text>]
1981 Instance <instance_name> owned by <tenant_name> has failed to schedule[, reason = <reason_text>]
1982 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1984 Alarm_Type: equipment
1985 Probable_Cause: unspecified-reason
1986 Service_Affecting: False
1991 Description: Create issued <by <tenant_name>|by the system> against <instance_name> owned by <tenant_name>
1992 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
1994 Alarm_Type: equipment
1995 Probable_Cause: unspecified-reason
1996 Service_Affecting: False
2001 Description: Creating instance <instance_name> owned by <tenant_name>
2002 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2004 Alarm_Type: equipment
2005 Probable_Cause: unspecified-reason
2006 Service_Affecting: False
2011 Description: "Create rejected for instance <instance_name>[, reason = <reason_text>]"
2012 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2014 Alarm_Type: equipment
2015 Probable_Cause: unspecified-reason
2016 Service_Affecting: False
2021 Description: "Create cancelled for instance <instance_name>[, reason = <reason_text>]"
2022 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2024 Alarm_Type: equipment
2025 Probable_Cause: unspecified-reason
2026 Service_Affecting: False
2031 Description: "Create failed for instance <instance_name>[, reason = <reason_text>]"
2032 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2034 Alarm_Type: equipment
2035 Probable_Cause: unspecified-reason
2036 Service_Affecting: False
2041 Description: Instance <instance_name> owned by <tenant_name> has been created
2042 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2044 Alarm_Type: equipment
2045 Probable_Cause: unspecified-reason
2046 Service_Affecting: False
2051 Description: "Delete issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2052 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2054 Alarm_Type: equipment
2055 Probable_Cause: unspecified-reason
2056 Service_Affecting: False
2061 Description: Deleting instance <instance_name> owned by <tenant_name>
2062 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2064 Alarm_Type: equipment
2065 Probable_Cause: unspecified-reason
2066 Service_Affecting: False
2071 Description: "Delete rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2072 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2074 Alarm_Type: equipment
2075 Probable_Cause: unspecified-reason
2076 Service_Affecting: False
2081 Description: "Delete cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2082 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2084 Alarm_Type: equipment
2085 Probable_Cause: unspecified-reason
2086 Service_Affecting: False
2091 Description: "Delete failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2092 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2094 Alarm_Type: equipment
2095 Probable_Cause: unspecified-reason
2096 Service_Affecting: False
2101 Description: Deleted instance <instance_name> owned by <tenant_name>
2102 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2104 Alarm_Type: equipment
2105 Probable_Cause: unspecified-reason
2106 Service_Affecting: False
2111 Description: "Pause issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2112 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2114 Alarm_Type: equipment
2115 Probable_Cause: unspecified-reason
2116 Service_Affecting: False
2121 Description: Pause in progress for instance <instance_name> on host <host_name>
2122 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2124 Alarm_Type: equipment
2125 Probable_Cause: unspecified-reason
2126 Service_Affecting: False
2131 Description: "Pause rejected for instance <instance_name> enabled on host <host_name>[, reason = <reason_text>]"
2132 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2134 Alarm_Type: equipment
2135 Probable_Cause: unspecified-reason
2136 Service_Affecting: False
2141 Description: "Pause cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2142 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2144 Alarm_Type: equipment
2145 Probable_Cause: unspecified-reason
2146 Service_Affecting: False
2151 Description: "Pause failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2152 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2154 Alarm_Type: equipment
2155 Probable_Cause: unspecified-reason
2156 Service_Affecting: False
2161 Description: Pause complete for instance <instance_name> now paused on host <host_name>
2162 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2164 Alarm_Type: equipment
2165 Probable_Cause: unspecified-reason
2166 Service_Affecting: False
2171 Description: "Un-pause issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2172 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2174 Alarm_Type: equipment
2175 Probable_Cause: unspecified-reason
2176 Service_Affecting: False
2181 Description: Un-pause in-progress for instance <instance_name> on host <host_name>
2182 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2184 Alarm_Type: equipment
2185 Probable_Cause: unspecified-reason
2186 Service_Affecting: False
2191 Description: "Un-pause rejected for instance <instance_name> paused on host <host_name>[, reason = <reason_text>]"
2192 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2194 Alarm_Type: equipment
2195 Probable_Cause: unspecified-reason
2196 Service_Affecting: False
2201 Description: "Un-pause cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2202 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2204 Alarm_Type: equipment
2205 Probable_Cause: unspecified-reason
2206 Service_Affecting: False
2211 Description: "Un-pause failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2212 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2214 Alarm_Type: equipment
2215 Probable_Cause: unspecified-reason
2216 Service_Affecting: False
2221 Description: Un-pause complete for instance <instance_name> now enabled on host <host_name>
2222 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2224 Alarm_Type: equipment
2225 Probable_Cause: unspecified-reason
2226 Service_Affecting: False
2231 Description: "Suspend issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2232 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2234 Alarm_Type: equipment
2235 Probable_Cause: unspecified-reason
2236 Service_Affecting: False
2241 Description: Suspend in-progress for instance <instance_name> on host <host_name>
2242 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2244 Alarm_Type: equipment
2245 Probable_Cause: unspecified-reason
2246 Service_Affecting: False
2251 Description: "Suspend rejected for instance <instance_name> enabled on host <host_name>[, reason = <reason_text>]"
2252 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2254 Alarm_Type: equipment
2255 Probable_Cause: unspecified-reason
2256 Service_Affecting: False
2261 Description: "Suspend cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2262 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2264 Alarm_Type: equipment
2265 Probable_Cause: unspecified-reason
2266 Service_Affecting: False
2271 Description: "Suspend failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2272 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2274 Alarm_Type: equipment
2275 Probable_Cause: unspecified-reason
2276 Service_Affecting: False
2281 Description: Suspend complete for instance <instance_name> now suspended on host <host_name>
2282 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2284 Alarm_Type: equipment
2285 Probable_Cause: unspecified-reason
2286 Service_Affecting: False
2291 Description: "Resume issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2292 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2294 Alarm_Type: equipment
2295 Probable_Cause: unspecified-reason
2296 Service_Affecting: False
2301 Description: Resume in-progress for instance <instance_name> on host <host_name>
2302 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2304 Alarm_Type: equipment
2305 Probable_Cause: unspecified-reason
2306 Service_Affecting: False
2311 Description: "Resume rejected for instance <instance_name> suspended on host <host_name>[, reason = <reason_text>]"
2312 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2314 Alarm_Type: equipment
2315 Probable_Cause: unspecified-reason
2316 Service_Affecting: False
2321 Description: "Resume cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2322 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2324 Alarm_Type: equipment
2325 Probable_Cause: unspecified-reason
2326 Service_Affecting: False
2331 Description: "Resume failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2332 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2334 Alarm_Type: equipment
2335 Probable_Cause: unspecified-reason
2336 Service_Affecting: False
2341 Description: Resume complete for instance <instance_name> now enabled on host <host_name>
2342 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2344 Alarm_Type: equipment
2345 Probable_Cause: unspecified-reason
2346 Service_Affecting: False
2351 Description: "Start issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2352 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2354 Alarm_Type: equipment
2355 Probable_Cause: unspecified-reason
2356 Service_Affecting: False
2361 Description: Start in-progress for instance <instance_name> on host <host_name>
2362 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2364 Alarm_Type: equipment
2365 Probable_Cause: unspecified-reason
2366 Service_Affecting: False
2371 Description: "Start rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2372 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2374 Alarm_Type: equipment
2375 Probable_Cause: unspecified-reason
2376 Service_Affecting: False
2381 Description: "Start cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2382 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2384 Alarm_Type: equipment
2385 Probable_Cause: unspecified-reason
2386 Service_Affecting: False
2391 Description: "Start failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2392 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2394 Alarm_Type: equipment
2395 Probable_Cause: unspecified-reason
2396 Service_Affecting: False
2401 Description: Start complete for instance <instance_name> now enabled on host <host_name>
2402 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2404 Alarm_Type: equipment
2405 Probable_Cause: unspecified-reason
2406 Service_Affecting: False
2411 Description: "Stop issued <by <tenant_name>|by the system|by the instance> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2412 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2414 Alarm_Type: equipment
2415 Probable_Cause: unspecified-reason
2416 Service_Affecting: False
2421 Description: Stop in progress for instance <instance_name> on host <host_name>
2422 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2424 Alarm_Type: equipment
2425 Probable_Cause: unspecified-reason
2426 Service_Affecting: False
2431 Description: "Stop rejected for instance <instance_name> enabled on host <host_name>[, reason = <reason_text>]"
2432 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2434 Alarm_Type: equipment
2435 Probable_Cause: unspecified-reason
2436 Service_Affecting: False
2441 Description: "Stop cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2442 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2444 Alarm_Type: equipment
2445 Probable_Cause: unspecified-reason
2446 Service_Affecting: False
2451 Description: "Stop failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2452 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2454 Alarm_Type: equipment
2455 Probable_Cause: unspecified-reason
2456 Service_Affecting: False
2461 Description: Stop complete for instance <instance_name> now disabled on host <host_name>
2462 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2464 Alarm_Type: equipment
2465 Probable_Cause: unspecified-reason
2466 Service_Affecting: False
2471 Description: "Live-Migrate issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> from host <host_name>[, reason = <reason_text>]"
2472 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2474 Alarm_Type: equipment
2475 Probable_Cause: unspecified-reason
2476 Service_Affecting: False
2481 Description: Live-Migrate in progress for instance <instance_name> from host <host_name>
2482 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2484 Alarm_Type: equipment
2485 Probable_Cause: unspecified-reason
2486 Service_Affecting: False
2491 Description: "Live-Migrate rejected for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2492 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2494 Alarm_Type: equipment
2495 Probable_Cause: unspecified-reason
2496 Service_Affecting: False
2501 Description: "Live-Migrate cancelled for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2502 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2504 Alarm_Type: equipment
2505 Probable_Cause: unspecified-reason
2506 Service_Affecting: False
2511 Description: "Live-Migrate failed for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2512 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2514 Alarm_Type: equipment
2515 Probable_Cause: unspecified-reason
2516 Service_Affecting: False
2521 Description: Live-Migrate complete for instance <instance_name> now enabled on host <host_name>
2522 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2524 Alarm_Type: equipment
2525 Probable_Cause: unspecified-reason
2526 Service_Affecting: False
2531 Description: "Cold-Migrate issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> from host <host_name>[, reason = <reason_text>]"
2532 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2534 Alarm_Type: equipment
2535 Probable_Cause: unspecified-reason
2536 Service_Affecting: False
2541 Description: Cold-Migrate in progress for instance <instance_name> from host <host_name>
2542 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2544 Alarm_Type: equipment
2545 Probable_Cause: unspecified-reason
2546 Service_Affecting: False
2551 Description: "Cold-Migrate rejected for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2552 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2554 Alarm_Type: equipment
2555 Probable_Cause: unspecified-reason
2556 Service_Affecting: False
2561 Description: "Cold-Migrate cancelled for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2562 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2564 Alarm_Type: equipment
2565 Probable_Cause: unspecified-reason
2566 Service_Affecting: False
2571 Description: "Cold-Migrate failed for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2572 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2574 Alarm_Type: equipment
2575 Probable_Cause: unspecified-reason
2576 Service_Affecting: False
2581 Description: Cold-Migrate complete for instance <instance_name> now enabled on host <host_name>
2582 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2584 Alarm_Type: equipment
2585 Probable_Cause: unspecified-reason
2586 Service_Affecting: False
2591 Description: "Cold-Migrate-Confirm issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2592 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2594 Alarm_Type: equipment
2595 Probable_Cause: unspecified-reason
2596 Service_Affecting: False
2601 Description: Cold-Migrate-Confirm in progress for instance <instance_name> on host <host_name>
2602 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2604 Alarm_Type: equipment
2605 Probable_Cause: unspecified-reason
2606 Service_Affecting: False
2611 Description: "Cold-Migrate-Confirm rejected for instance <instance_name> now enabled on host <host_name>[, reason = <reason_text>]"
2612 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2614 Alarm_Type: equipment
2615 Probable_Cause: unspecified-reason
2616 Service_Affecting: False
2621 Description: "Cold-Migrate-Confirm cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2622 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2624 Alarm_Type: equipment
2625 Probable_Cause: unspecified-reason
2626 Service_Affecting: False
2631 Description: "Cold-Migrate-Confirm failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2632 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2634 Alarm_Type: equipment
2635 Probable_Cause: unspecified-reason
2636 Service_Affecting: False
2641 Description: Cold-Migrate-Confirm complete for instance <instance_name> enabled on host <host_name>
2642 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2644 Alarm_Type: equipment
2645 Probable_Cause: unspecified-reason
2646 Service_Affecting: False
2651 Description: "Cold-Migrate-Revert issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2652 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2654 Alarm_Type: equipment
2655 Probable_Cause: unspecified-reason
2656 Service_Affecting: False
2661 Description: Cold-Migrate-Revert in progress for instance <instance_name> from host <host_name>
2662 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2664 Alarm_Type: equipment
2665 Probable_Cause: unspecified-reason
2666 Service_Affecting: False
2671 Description: "Cold-Migrate-Revert rejected for instance <instance_name> now on host <host_name>[, reason = <reason_text>]"
2672 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2674 Alarm_Type: equipment
2675 Probable_Cause: unspecified-reason
2676 Service_Affecting: False
2681 Description: "Cold-Migrate-Revert cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2682 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2684 Alarm_Type: equipment
2685 Probable_Cause: unspecified-reason
2686 Service_Affecting: False
2691 Description: "Cold-Migrate-Revert failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2692 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2694 Alarm_Type: equipment
2695 Probable_Cause: unspecified-reason
2696 Service_Affecting: False
2701 Description: Cold-Migrate-Revert complete for instance <instance_name> now enabled on host <host_name>
2702 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2704 Alarm_Type: equipment
2705 Probable_Cause: unspecified-reason
2706 Service_Affecting: False
2711 Description: "Evacuate issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2712 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2714 Alarm_Type: equipment
2715 Probable_Cause: unspecified-reason
2716 Service_Affecting: False
2721 Description: Evacuating instance <instance_name> owned by <tenant_name> from host <host_name>
2722 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2724 Alarm_Type: equipment
2725 Probable_Cause: unspecified-reason
2726 Service_Affecting: False
2731 Description: "Evacuate rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2732 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2734 Alarm_Type: equipment
2735 Probable_Cause: unspecified-reason
2736 Service_Affecting: False
2741 Description: "Evacuate cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2742 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2744 Alarm_Type: equipment
2745 Probable_Cause: unspecified-reason
2746 Service_Affecting: False
2751 Description: "Evacuate failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2752 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2754 Alarm_Type: equipment
2755 Probable_Cause: unspecified-reason
2756 Service_Affecting: False
2761 Description: Evacuate complete for instance <instance_name> now enabled on host <host_name>
2762 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2764 Alarm_Type: equipment
2765 Probable_Cause: unspecified-reason
2766 Service_Affecting: False
2771 Description: "Reboot <(soft-reboot)|(hard-reboot)> issued <by <tenant_name>|by the system|by the instance> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2772 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2774 Alarm_Type: equipment
2775 Probable_Cause: unspecified-reason
2776 Service_Affecting: False
2781 Description: Reboot in progress for instance <instance_name> on host <host_name>
2782 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2784 Alarm_Type: equipment
2785 Probable_Cause: unspecified-reason
2786 Service_Affecting: False
2791 Description: "Reboot rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2792 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2794 Alarm_Type: equipment
2795 Probable_Cause: unspecified-reason
2796 Service_Affecting: False
2801 Description: "Reboot cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2802 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2804 Alarm_Type: equipment
2805 Probable_Cause: unspecified-reason
2806 Service_Affecting: False
2811 Description: "Reboot failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2812 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2814 Alarm_Type: equipment
2815 Probable_Cause: unspecified-reason
2816 Service_Affecting: False
2821 Description: Reboot complete for instance <instance_name> now enabled on host <host_name>
2822 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2824 Alarm_Type: equipment
2825 Probable_Cause: unspecified-reason
2826 Service_Affecting: False
2831 Description: "Rebuild issued <by <tenant_name>|by the system> against instance <instance_name> using image <image_name> on host <host_name>[, reason = <reason_text>]"
2832 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2834 Alarm_Type: equipment
2835 Probable_Cause: unspecified-reason
2836 Service_Affecting: False
2841 Description: Rebuild in progress for instance <instance_name> on host <host_name>
2842 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2844 Alarm_Type: equipment
2845 Probable_Cause: unspecified-reason
2846 Service_Affecting: False
2851 Description: "Rebuild rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2852 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2854 Alarm_Type: equipment
2855 Probable_Cause: unspecified-reason
2856 Service_Affecting: False
2861 Description: "Rebuild cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2862 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2864 Alarm_Type: equipment
2865 Probable_Cause: unspecified-reason
2866 Service_Affecting: False
2871 Description: "Rebuild failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2872 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2874 Alarm_Type: equipment
2875 Probable_Cause: unspecified-reason
2876 Service_Affecting: False
2881 Description: Rebuild complete for instance <instance_name> now enabled on host <host_name>
2882 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2884 Alarm_Type: equipment
2885 Probable_Cause: unspecified-reason
2886 Service_Affecting: False
2891 Description: "Resize issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2892 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2894 Alarm_Type: equipment
2895 Probable_Cause: unspecified-reason
2896 Service_Affecting: False
2901 Description: Resize in progress for instance <instance_name> on host <host_name>
2902 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2904 Alarm_Type: equipment
2905 Probable_Cause: unspecified-reason
2906 Service_Affecting: False
2911 Description: "Resize rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2912 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2914 Alarm_Type: equipment
2915 Probable_Cause: unspecified-reason
2916 Service_Affecting: False
2921 Description: "Resize cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2922 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2924 Alarm_Type: equipment
2925 Probable_Cause: unspecified-reason
2926 Service_Affecting: False
2931 Description: "Resize failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2932 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2934 Alarm_Type: equipment
2935 Probable_Cause: unspecified-reason
2936 Service_Affecting: False
2941 Description: Resize complete for instance <instance_name> enabled on host <host_name> waiting for confirmation
2942 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2944 Alarm_Type: equipment
2945 Probable_Cause: unspecified-reason
2946 Service_Affecting: False
2951 Description: "Resize-Confirm issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
2952 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2954 Alarm_Type: equipment
2955 Probable_Cause: unspecified-reason
2956 Service_Affecting: False
2961 Description: Resize-Confirm in progress for instance <instance_name> on host <host_name>
2962 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2964 Alarm_Type: equipment
2965 Probable_Cause: unspecified-reason
2966 Service_Affecting: False
2971 Description: "Resize-Confirm rejected for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2972 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2974 Alarm_Type: equipment
2975 Probable_Cause: unspecified-reason
2976 Service_Affecting: False
2981 Description: "Resize-Confirm cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2982 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2984 Alarm_Type: equipment
2985 Probable_Cause: unspecified-reason
2986 Service_Affecting: False
2991 Description: "Resize-Confirm failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
2992 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
2994 Alarm_Type: equipment
2995 Probable_Cause: unspecified-reason
2996 Service_Affecting: False
3001 Description: Resize-Confirm complete for instance <instance_name> enabled on host <host_name>
3002 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3004 Alarm_Type: equipment
3005 Probable_Cause: unspecified-reason
3006 Service_Affecting: False
3011 Description: "Resize-Revert issued <by <tenant_name>|by the system> against instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
3012 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3014 Alarm_Type: equipment
3015 Probable_Cause: unspecified-reason
3016 Service_Affecting: False
3021 Description: Resize-Revert in progress for instance <instance_name> on host <host_name>
3022 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3024 Alarm_Type: equipment
3025 Probable_Cause: unspecified-reason
3026 Service_Affecting: False
3031 Description: "Resize-Revert rejected for instance <instance_name> owned by <tenant_name> on host <host_name>[, reason = <reason_text>]"
3032 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3034 Alarm_Type: equipment
3035 Probable_Cause: unspecified-reason
3036 Service_Affecting: False
3041 Description: "Resize-Revert cancelled for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
3042 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3044 Alarm_Type: equipment
3045 Probable_Cause: unspecified-reason
3046 Service_Affecting: False
3051 Description: "Resize-Revert failed for instance <instance_name> on host <host_name>[, reason = <reason_text>]"
3052 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3054 Alarm_Type: equipment
3055 Probable_Cause: unspecified-reason
3056 Service_Affecting: False
3061 Description: Resize-Revert complete for instance <instance_name> enabled on host <host_name>
3062 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3064 Alarm_Type: equipment
3065 Probable_Cause: unspecified-reason
3066 Service_Affecting: False
3071 Description: Guest Heartbeat established for instance <instance_name> on host <host_name>
3072 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3074 Alarm_Type: equipment
3075 Probable_Cause: unspecified-reason
3076 Service_Affecting: False
3081 Description: Guest Heartbeat disconnected for instance <instance_name> on host <host_name>
3082 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3084 Alarm_Type: equipment
3085 Probable_Cause: unspecified-reason
3086 Service_Affecting: False
3091 Description: "Guest Heartbeat failed for instance <instance_name>[, reason = <reason_text>]"
3092 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3094 Alarm_Type: equipment
3095 Probable_Cause: unspecified-reason
3096 Service_Affecting: False
3101 Description: Instance <instance_name> has been renamed to <new_instance_name> owned by <tenant_name> on host <host_name>
3102 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3104 Alarm_Type: equipment
3105 Probable_Cause: unspecified-reason
3106 Service_Affecting: False
3111 Description: "Guest Health Check failed for instance <instance_name>[, reason = <reason_text>]"
3112 Entity_Instance_ID: tenant=<tenant-uuid>.instance=<instance-uuid>
3114 Alarm_Type: equipment
3115 Probable_Cause: unspecified-reason
3116 Service_Affecting: False
3121 Description: "Entered Multi-Node Recovery Mode"
3122 Entity_Instance_ID: subsystem=vim
3124 Alarm_Type: equipment
3125 Probable_Cause: unspecified-reason
3126 Service_Affecting: False
3132 Description: "Exited Multi-Node Recovery Mode"
3133 Entity_Instance_ID: subsystem=vim
3135 Alarm_Type: equipment
3136 Probable_Cause: unspecified-reason
3137 Service_Affecting: False
3140 #---------------------------------------------------------------------------
3142 #---------------------------------------------------------------------------
3146 Description: "Application Upload Failure"
3147 Entity_Instance_ID: k8s_application=<appname>
3149 Proposed_Repair_Action: "Check system inventory log for cause."
3152 Alarm_Type: processing-error
3153 Probable_Cause: unknown
3154 Service_Affecting: False
3156 Management_Affecting_Severity: none
3157 Degrade_Affecting_Severity: none
3162 Description: "Application Apply Failure"
3163 Entity_Instance_ID: k8s_application=<appname>
3165 Proposed_Repair_Action: "Retry applying the application. Check that the application is managed by the system application framework.
3166 If the issue persists, please check system inventory log for cause."
3169 Alarm_Type: processing-error
3170 Probable_Cause: unknown
3171 Service_Affecting: True
3173 Management_Affecting_Severity: none
3174 Degrade_Affecting_Severity: none
3179 Description: "Application Remove Failure"
3180 Entity_Instance_ID: k8s_application=<appname>
3182 Proposed_Repair_Action: "Retry removing the application. If the issue persists, please check system inventory log for cause."
3185 Alarm_Type: processing-error
3186 Probable_Cause: unknown
3187 Service_Affecting: True
3189 Management_Affecting_Severity: none
3190 Degrade_Affecting_Severity: none
3195 Description: "Application Apply In Progress"
3196 Entity_Instance_ID: k8s_application=<appname>
3198 Proposed_Repair_Action: "No action required."
3202 Probable_Cause: unknown
3203 Service_Affecting: True
3205 Management_Affecting_Severity: warning
3206 Degrade_Affecting_Severity: none
3211 Description: "Application Update In Progress"
3212 Entity_Instance_ID: k8s_application=<appname>
3214 Proposed_Repair_Action: "No action required."
3218 Probable_Cause: unknown
3219 Service_Affecting: True
3221 Management_Affecting_Severity: warning
3222 Degrade_Affecting_Severity: none
3227 Description: "Automatic Application Re-Apply Is Pending"
3228 Entity_Instance_ID: k8s_application=<appname>
3230 Proposed_Repair_Action: "Ensure all hosts are either locked or unlocked. When the system is stable, the application will be automatically reapplied."
3234 Probable_Cause: unknown
3235 Service_Affecting: False
3237 Management_Affecting_Severity: none
3238 Degrade_Affecting_Severity: none
3241 #---------------------------------------------------------------------------
3243 #---------------------------------------------------------------------------
3248 Possible data loss. Any mds, mon or osd is unavailable in storage replication group.
3249 Entity_Instance_ID: cluster=<dist-fs-uuid>
3250 Severity: [critical, major]
3251 Proposed_Repair_Action: "Manually restart Ceph processes and check the state of the Ceph cluster with
3253 If problem persists, contact next level of support."
3256 Alarm_Type: equipment
3257 Probable_Cause: equipment-malfunction
3262 Management_Affecting_Severity: warning
3263 Degrade_Affecting_Severity: none
3269 Potential data loss. No available OSDs in storage replication group.
3270 Entity_Instance_ID: cluster=<dist-fs-uuid>.peergroup=<group-x>
3271 Severity: [critical]
3272 Proposed_Repair_Action: "Ensure storage hosts from replication group are unlocked and available.
3273 Check replication group state with 'system host-list'
3274 Check if OSDs of each storage host are up and running.
3275 Manually restart Ceph processes and check the state of the Ceph OSDs with
3276 'ceph osd stat' OR 'ceph osd tree'
3277 If problem persists, contact next level of support."
3280 Alarm_Type: equipment
3281 Probable_Cause: equipment-malfunction
3285 Management_Affecting_Severity: warning
3286 Degrade_Affecting_Severity: none
3292 Loss of replication in peergroup.
3293 Entity_Instance_ID: cluster=<dist-fs-uuid>.peergroup=<group-x>
3295 Proposed_Repair_Action: "Ensure storage hosts from replication group are unlocked and available.
3296 Check replication group state with 'system host-list'
3297 Check if OSDs of each storage host are up and running.
3298 Manually restart Ceph processes and check the state of the Ceph OSDs with
3299 'ceph osd stat' AND/OR 'ceph osd tree'
3300 If problem persists, contact next level of support."
3303 Alarm_Type: equipment
3304 Probable_Cause: equipment-malfunction
3308 Management_Affecting_Severity: warning
3309 Degrade_Affecting_Severity: none
3315 Image storage media is full: There is not enough disk space on the image storage media.
3317 Instance <instance name> snapshot failed: There is not enough disk space on the image storage media.
3319 Supplied <attrs> (<supplied>) and <attrs> generated from uploaded image (<actual>) did not match. Setting image status to 'killed'.
3321 Error in store configuration. Adding images to store is disabled.
3323 Forbidden upload attempt: <exception>.
3325 Insufficient permissions on image storage media: <exception>.
3327 Denying attempt to upload image larger than <size> bytes.
3329 Denying attempt to upload image because it exceeds the quota: <exception>.
3331 Received HTTP error while uploading image <image_id>.
3333 Client disconnected before sending all data to backend.
3335 Failed to upload image <image_id>.
3337 image=<image-uuid> instance=<instance-uuid>
3339 tenant=<tenant-uuid> instance=<instance-uuid>
3341 image=<image-uuid> instance=<instance-uuid>
3343 image=<image-uuid> instance=<instance-uuid>
3345 image=<image-uuid> instance=<instance-uuid>
3347 image=<image-uuid> instance=<instance-uuid>
3349 image=<image-uuid> instance=<instance-uuid>
3351 image=<image-uuid> instance=<instance-uuid>
3353 image=<image-uuid> instance=<instance-uuid>
3355 image=<image-uuid> instance=<instance-uuid>
3357 image=<image-uuid> instance=<instance-uuid>
3358 Alarm_Type: [physical-violation,
3360 integrity-violation,
3361 integrity-violation,
3362 security-service-or-mechanism-violation,
3363 security-service-or-mechanism-violation,
3364 security-service-or-mechanism-violation,
3365 security-service-or-mechanism-violation,
3368 operational-violation]
3370 Proposed_Repair_Action:
3373 Probable_Cause: unspecified-reason
3374 Service_Affecting: False
3376 Management_Affecting_Severity: none
3377 Degrade_Affecting_Severity: none
3383 Storage Alarm Condition:
3384 Cinder I/O Congestion is above normal range and is building
3385 Entity_Instance_ID: cinder_io_monitor
3387 Proposed_Repair_Action: "Reduce the I/O load on the Cinder LVM backend. Use
3388 Cinder QoS mechanisms on high usage volumes."
3392 Probable_Cause: congestion
3393 Service_Affecting: False
3395 Management_Affecting_Severity: none
3396 Degrade_Affecting_Severity: none
3402 Storage Alarm Condition:
3403 Cinder I/O Congestion is high and impacting guest performance
3404 Entity_Instance_ID: cinder_io_monitor
3406 Proposed_Repair_Action: "Reduce the I/O load on the Cinder LVM backend.
3407 Cinder actions may fail until congestion is reduced.
3408 Use Cinder QoS mechanisms on high usage volumes."
3412 Probable_Cause: congestion
3413 Service_Affecting: False
3415 Management_Affecting_Severity: warning
3416 Degrade_Affecting_Severity: none
3422 Storage Alarm Condition:
3423 <storage-backend-name> configuration failed to apply on host: <host-uuid>.
3424 Entity_Instance_ID: storage_backend=<storage-backend-name>
3426 Proposed_Repair_Action: "Update backend setting to reapply configuration.
3427 Use the following commands to try again:
3428 'system storage-backend-delete <storage-backend-name>'
3430 'system storage-backend-add <storage-backend-name>'
3431 See the |prod-long| documentation at |docs-url| for more details.
3432 If problem persists, contact next level of support."
3435 Alarm_Type: equipment
3436 Probable_Cause: configuration-or-customization-error
3437 Service_Affecting: True
3439 Management_Affecting_Severity: major
3440 Degrade_Affecting_Severity: none
3446 Filesystem Alarm Condition:
3447 <controllerfs_name> controller filesystem was not created/deleted successfully.
3448 Entity_Instance_ID: host=<hostname>.controllerfs=<controllerfs_name>
3450 Proposed_Repair_Action: "Use the create or delete command again:
3451 'system controllerfs-delete' or 'system controllerfs-add'.
3452 If problem persists, contact next level of support."
3455 Alarm_Type: processing-error
3456 Probable_Cause: unspecified-reason
3457 Service_Affecting: True
3459 Management_Affecting_Severity: major
3460 Degrade_Affecting_Severity: none
3463 #---------------------------------------------------------------------------
3465 #---------------------------------------------------------------------------
3469 Description: Persistent Volume Migration Error
3470 Entity_Instance_ID: kubernetes=PV-migration-failed
3472 Proposed_Repair_Action: "Manually execute /usr/bin/ceph_k8s_update_monitors.sh
3473 to confirm PVs are updated, then lock/unlock to clear
3474 alarms. If problem persists, contact next level of
3478 Alarm_Type: processing-error
3479 Probable_Cause: communication-subsystem-failure
3480 Service_Affecting: False
3482 Management_Affecting_Severity: none
3483 Degrade_Affecting_Severity: none
3488 Description: Kubernetes cluster unreachable
3489 Entity_Instance_ID: kubernetes=k8s-health-check-failed
3491 Proposed_Repair_Action: "If problem persists,
3492 contact next level of support."
3495 Alarm_Type: communication
3496 Probable_Cause: out-of-service
3497 Service_Affecting: True
3499 Management_Affecting_Severity: major
3500 Degrade_Affecting_Severity: none
3503 #---------------------------------------------------------------------------
3505 #---------------------------------------------------------------------------
3509 Description: Patching operation in progress.
3510 Entity_Instance_ID: host=controller
3512 Proposed_Repair_Action: Complete reboots of affected hosts.
3515 Alarm_Type: environmental
3516 Probable_Cause: unspecified-reason
3517 Service_Affecting: False
3519 Management_Affecting_Severity: warning
3520 Degrade_Affecting_Severity: none
3525 Description: Patch host install failure. Command "sw-patch host-install" failed.
3526 Entity_Instance_ID: host=<hostname>
3528 Proposed_Repair_Action: Undo patching operation. Check patch logs on the target host (i.e. /var/log/patching.log)
3531 Alarm_Type: environmental
3532 Probable_Cause: unspecified-reason
3533 Service_Affecting: False
3535 Management_Affecting_Severity: warning
3536 Degrade_Affecting_Severity: none
3541 Description: A patch with state 'obsolete' in its metadata has been uploaded.
3542 Entity_Instance_ID: host=controller
3544 Proposed_Repair_Action: Remove and delete obsolete patches.
3547 Alarm_Type: environmental
3548 Probable_Cause: unspecified-reason
3549 Service_Affecting: False
3551 Management_Affecting_Severity: warning
3552 Degrade_Affecting_Severity: none
3557 Description: The upgrade and running software version do not match. Command host-upgrade failed.
3558 Entity_Instance_ID: host=<hostname>
3560 Proposed_Repair_Action: Reinstall host to update applied load.
3563 Alarm_Type: operational-violation
3564 Probable_Cause: unspecified-reason
3565 Service_Affecting: True
3567 Management_Affecting_Severity: warning
3568 Degrade_Affecting_Severity: none
3573 Description: System Upgrade in progress.
3574 Entity_Instance_ID: host=controller
3576 Proposed_Repair_Action: No action required.
3579 Alarm_Type: operational-violation
3580 Probable_Cause: unspecified-reason
3581 Service_Affecting: False
3583 Management_Affecting_Severity: warning
3584 Degrade_Affecting_Severity: none
3589 Description: Device image update operation in progress.
3590 Entity_Instance_ID: host=controller
3592 Proposed_Repair_Action: Complete reboots of affected hosts.
3595 Alarm_Type: environmental
3596 Probable_Cause: unspecified-reason
3597 Service_Affecting: False
3599 Management_Affecting_Severity: warning
3600 Degrade_Affecting_Severity: none
3605 Description: Kubernetes upgrade in progress.
3606 Entity_Instance_ID: host=controller
3608 Proposed_Repair_Action: No action required.
3611 Alarm_Type: operational-violation
3612 Probable_Cause: unspecified-reason
3613 Service_Affecting: False
3615 Management_Affecting_Severity: warning
3616 Degrade_Affecting_Severity: none
3621 Description: Kubernetes rootca update in progress
3622 Entity_Instance_ID: host=controller
3624 Proposed_Repair_Action: Wait for kubernetes rootca procedure to complete
3627 Alarm_Type: operational-violation
3628 Probable_Cause: unspecified-reason
3629 Service_Affecting: False
3631 Management_Affecting_Severity: warning
3632 Degrade_Affecting_Severity: none
3637 Description: Kubernetes root CA update aborted, certificates may not be fully updated. Command "system kube-rootca-update-abort" has been run.
3638 Entity_Instance_ID: host=controller
3640 Proposed_Repair_Action: Fully update certificates by a new root CA update.
3643 Alarm_Type: operational-violation
3644 Probable_Cause: unspecified-reason
3645 Service_Affecting: False
3647 Management_Affecting_Severity: warning
3648 Degrade_Affecting_Severity: none
3653 Description: System Config update in progress
3654 Entity_Instance_ID: host=controller
3656 Proposed_Repair_Action: Wait for system config update to complete
3659 Alarm_Type: operational-violation
3660 Probable_Cause: unspecified-reason
3661 Service_Affecting: False
3663 Management_Affecting_Severity: warning
3664 Degrade_Affecting_Severity: none
3669 Description: System Config update aborted, configurations may not be fully updated
3670 Entity_Instance_ID: host=<hostname>
3672 Proposed_Repair_Action: Lock the host, wait for the host resource in the deployment namespace to become in-sync, then unlock the host
3675 Alarm_Type: operational-violation
3676 Probable_Cause: unspecified-reason
3677 Service_Affecting: False
3679 Management_Affecting_Severity: warning
3680 Degrade_Affecting_Severity: none
3685 Description: Deploy host completed with success
3686 Entity_Instance_ID: host=<hostname>
3688 Proposed_Repair_Action: Unlock host
3691 Alarm_Type: equipment
3692 Probable_Cause: unspecified-reason
3693 Service_Affecting: False
3695 Management_Affecting_Severity: none
3696 Degrade_Affecting_Severity: none
3701 Description: Deploy host failed
3702 Entity_Instance_ID: host=<hostname>
3704 Proposed_Repair_Action: Check the logs for errors, fix the issues manually and retry
3707 Alarm_Type: equipment
3708 Probable_Cause: unspecified-reason
3709 Service_Affecting: True
3711 Management_Affecting_Severity: warning
3712 Degrade_Affecting_Severity: none
3717 Description: Software patch auto-apply in progress
3718 Entity_Instance_ID: orchestration=sw-patch
3720 Proposed_Repair_Action: Wait for software patch auto-apply to complete; if problem persists contact next level of support
3723 Alarm_Type: equipment
3724 Probable_Cause: unspecified-reason
3725 Service_Affecting: True
3727 Management_Affecting_Severity: warning
3728 Degrade_Affecting_Severity: none
3733 Description: Software patch auto-apply aborting
3734 Entity_Instance_ID: orchestration=sw-patch
3736 Proposed_Repair_Action: Wait for software patch auto-apply abort to complete; if problem persists contact next level of support
3739 Alarm_Type: equipment
3740 Probable_Cause: unspecified-reason
3741 Service_Affecting: True
3743 Management_Affecting_Severity: warning
3744 Degrade_Affecting_Severity: none
3749 Description: Software patch auto-apply failed. Command "sw-manager patch-strategy apply" failed.
3750 Entity_Instance_ID: orchestration=sw-patch
3752 Proposed_Repair_Action: Attempt to apply software patches manually; if problem persists contact next level of support
3755 Alarm_Type: equipment
3756 Probable_Cause: underlying-resource-unavailable
3757 Service_Affecting: True
3759 Management_Affecting_Severity: warning
3760 Degrade_Affecting_Severity: none
3765 Description: Software patch auto-apply start
3766 Entity_Instance_ID: orchestration=sw-patch
3768 Alarm_Type: equipment
3769 Probable_Cause: unspecified-reason
3770 Service_Affecting: False
3775 Description: Software patch auto-apply in progress
3776 Entity_Instance_ID: orchestration=sw-patch
3778 Alarm_Type: equipment
3779 Probable_Cause: unspecified-reason
3780 Service_Affecting: False
3785 Description: Software patch auto-apply rejected
3786 Entity_Instance_ID: orchestration=sw-patch
3788 Alarm_Type: equipment
3789 Probable_Cause: unspecified-reason
3790 Service_Affecting: False
3795 Description: Software patch auto-apply cancelled
3796 Entity_Instance_ID: orchestration=sw-patch
3798 Alarm_Type: equipment
3799 Probable_Cause: unspecified-reason
3800 Service_Affecting: False
3805 Description: Software patch auto-apply failed
3806 Entity_Instance_ID: orchestration=sw-patch
3808 Alarm_Type: equipment
3809 Probable_Cause: unspecified-reason
3810 Service_Affecting: False
3815 Description: Software patch auto-apply completed
3816 Entity_Instance_ID: orchestration=sw-patch
3818 Alarm_Type: equipment
3819 Probable_Cause: unspecified-reason
3820 Service_Affecting: False
3825 Description: Software patch auto-apply abort
3826 Entity_Instance_ID: orchestration=sw-patch
3828 Alarm_Type: equipment
3829 Probable_Cause: unspecified-reason
3830 Service_Affecting: False
3835 Description: Software patch auto-apply aborting
3836 Entity_Instance_ID: orchestration=sw-patch
3838 Alarm_Type: equipment
3839 Probable_Cause: unspecified-reason
3840 Service_Affecting: False
3845 Description: Software patch auto-apply abort rejected
3846 Entity_Instance_ID: orchestration=sw-patch
3848 Alarm_Type: equipment
3849 Probable_Cause: unspecified-reason
3850 Service_Affecting: False
3855 Description: Software patch auto-apply abort failed
3856 Entity_Instance_ID: orchestration=sw-patch
3858 Alarm_Type: equipment
3859 Probable_Cause: unspecified-reason
3860 Service_Affecting: False
3865 Description: Software patch auto-apply aborted
3866 Entity_Instance_ID: orchestration=sw-patch
3868 Alarm_Type: equipment
3869 Probable_Cause: unspecified-reason
3870 Service_Affecting: False
3875 Description: Software upgrade auto-apply in progress
3876 Entity_Instance_ID: orchestration=sw-upgrade
3878 Proposed_Repair_Action: Wait for software upgrade auto-apply to complete; if problem persists contact next level of support
3881 Alarm_Type: equipment
3882 Probable_Cause: unspecified-reason
3883 Service_Affecting: True
3885 Management_Affecting_Severity: warning
3886 Degrade_Affecting_Severity: none
3891 Description: Software upgrade auto-apply aborting
3892 Entity_Instance_ID: orchestration=sw-upgrade
3894 Proposed_Repair_Action: Wait for software upgrade auto-apply abort to complete; if problem persists contact next level of support
3897 Alarm_Type: equipment
3898 Probable_Cause: unspecified-reason
3899 Service_Affecting: True
3901 Management_Affecting_Severity: warning
3902 Degrade_Affecting_Severity: none
3907 Description: Software upgrade auto-apply failed. Command "sw-manager update-strategy apply" failed
3908 Entity_Instance_ID: orchestration=sw-upgrade
3910 Proposed_Repair_Action: Attempt to apply software upgrade manually; if problem persists contact next level of support
3913 Alarm_Type: equipment
3914 Probable_Cause: underlying-resource-unavailable
3915 Service_Affecting: True
3917 Management_Affecting_Severity: warning
3918 Degrade_Affecting_Severity: none
3923 Description: Software upgrade auto-apply start
3924 Entity_Instance_ID: orchestration=sw-upgrade
3926 Alarm_Type: equipment
3927 Probable_Cause: unspecified-reason
3928 Service_Affecting: False
3933 Description: Software upgrade auto-apply in progress
3934 Entity_Instance_ID: orchestration=sw-upgrade
3936 Alarm_Type: equipment
3937 Probable_Cause: unspecified-reason
3938 Service_Affecting: False
3943 Description: Software upgrade auto-apply rejected
3944 Entity_Instance_ID: orchestration=sw-upgrade
3946 Alarm_Type: equipment
3947 Probable_Cause: unspecified-reason
3948 Service_Affecting: False
3953 Description: Software upgrade auto-apply cancelled
3954 Entity_Instance_ID: orchestration=sw-upgrade
3956 Alarm_Type: equipment
3957 Probable_Cause: unspecified-reason
3958 Service_Affecting: False
3963 Description: Software upgrade auto-apply failed
3964 Entity_Instance_ID: orchestration=sw-upgrade
3966 Alarm_Type: equipment
3967 Probable_Cause: unspecified-reason
3968 Service_Affecting: False
3973 Description: Software upgrade auto-apply completed
3974 Entity_Instance_ID: orchestration=sw-upgrade
3976 Alarm_Type: equipment
3977 Probable_Cause: unspecified-reason
3978 Service_Affecting: False
3983 Description: Software upgrade auto-apply abort
3984 Entity_Instance_ID: orchestration=sw-upgrade
3986 Alarm_Type: equipment
3987 Probable_Cause: unspecified-reason
3988 Service_Affecting: False
3993 Description: Software upgrade auto-apply aborting
3994 Entity_Instance_ID: orchestration=sw-upgrade
3996 Alarm_Type: equipment
3997 Probable_Cause: unspecified-reason
3998 Service_Affecting: False
4003 Description: Software upgrade auto-apply abort rejected
4004 Entity_Instance_ID: orchestration=sw-upgrade
4006 Alarm_Type: equipment
4007 Probable_Cause: unspecified-reason
4008 Service_Affecting: False
4013 Description: Software upgrade auto-apply abort failed
4014 Entity_Instance_ID: orchestration=sw-upgrade
4016 Alarm_Type: equipment
4017 Probable_Cause: unspecified-reason
4018 Service_Affecting: False
4023 Description: Software upgrade auto-apply aborted
4024 Entity_Instance_ID: orchestration=sw-upgrade
4026 Alarm_Type: equipment
4027 Probable_Cause: unspecified-reason
4028 Service_Affecting: False
4033 Description: Software deploy state out of sync
4034 Entity_Instance_ID: orchestration=sw-upgrade
4036 Proposed_Repair_Action: Wait for the deployment on the active controller to complete. If problem persists contact next level of support
4039 Alarm_Type: equipment
4040 Probable_Cause: unspecified-reason
4041 Service_Affecting: True
4043 Management_Affecting_Severity: warning
4044 Degrade_Affecting_Severity: none
4049 Description: Firmware Update auto-apply in progress
4050 Entity_Instance_ID: orchestration=fw-update
4052 Proposed_Repair_Action: Wait for firmware update auto-apply to complete; if problem persists contact next level of support
4055 Alarm_Type: equipment
4056 Probable_Cause: unspecified-reason
4057 Service_Affecting: True
4059 Management_Affecting_Severity: warning
4060 Degrade_Affecting_Severity: none
4065 Description: Firmware Update auto-apply aborting
4066 Entity_Instance_ID: orchestration=fw-update
4068 Proposed_Repair_Action: Wait for firmware update auto-apply abort to complete; if problem persists contact next level of support
4071 Alarm_Type: equipment
4072 Probable_Cause: unspecified-reason
4073 Service_Affecting: True
4075 Management_Affecting_Severity: warning
4076 Degrade_Affecting_Severity: none
4081 Description: Firmware Update auto-apply failed. Command "sw-manager fw-update-strategy apply" failed.
4082 Entity_Instance_ID: orchestration=fw-update
4084 Proposed_Repair_Action: Attempt to apply firmware update manually; if problem persists contact next level of support
4087 Alarm_Type: equipment
4088 Probable_Cause: underlying-resource-unavailable
4089 Service_Affecting: True
4091 Management_Affecting_Severity: warning
4092 Degrade_Affecting_Severity: none
4097 Description: Firmware update auto-apply start
4098 Entity_Instance_ID: orchestration=fw-update
4100 Alarm_Type: equipment
4101 Probable_Cause: unspecified-reason
4102 Service_Affecting: False
4107 Description: Firmware update auto-apply in progress
4108 Entity_Instance_ID: orchestration=fw-update
4110 Alarm_Type: equipment
4111 Probable_Cause: unspecified-reason
4112 Service_Affecting: False
4117 Description: Firmware update auto-apply rejected
4118 Entity_Instance_ID: orchestration=fw-update
4120 Alarm_Type: equipment
4121 Probable_Cause: unspecified-reason
4122 Service_Affecting: False
4127 Description: Firmware update auto-apply cancelled
4128 Entity_Instance_ID: orchestration=fw-update
4130 Alarm_Type: equipment
4131 Probable_Cause: unspecified-reason
4132 Service_Affecting: False
4137 Description: Firmware update auto-apply failed
4138 Entity_Instance_ID: orchestration=fw-update
4140 Alarm_Type: equipment
4141 Probable_Cause: unspecified-reason
4142 Service_Affecting: False
4147 Description: Firmware update auto-apply completed
4148 Entity_Instance_ID: orchestration=fw-update
4150 Alarm_Type: equipment
4151 Probable_Cause: unspecified-reason
4152 Service_Affecting: False
4157 Description: Firmware update auto-apply abort
4158 Entity_Instance_ID: orchestration=fw-update
4160 Alarm_Type: equipment
4161 Probable_Cause: unspecified-reason
4162 Service_Affecting: False
4167 Description: Firmware update auto-apply aborting
4168 Entity_Instance_ID: orchestration=fw-update
4170 Alarm_Type: equipment
4171 Probable_Cause: unspecified-reason
4172 Service_Affecting: False
4177 Description: Firmware update auto-apply abort rejected
4178 Entity_Instance_ID: orchestration=fw-update
4180 Alarm_Type: equipment
4181 Probable_Cause: unspecified-reason
4182 Service_Affecting: False
4187 Description: Firmware update auto-apply abort failed
4188 Entity_Instance_ID: orchestration=fw-update
4190 Alarm_Type: equipment
4191 Probable_Cause: unspecified-reason
4192 Service_Affecting: False
4197 Description: Firmware update auto-apply aborted
4198 Entity_Instance_ID: orchestration=fw-update
4200 Alarm_Type: equipment
4201 Probable_Cause: unspecified-reason
4202 Service_Affecting: False
4207 Description: Kubernetes upgrade auto-apply in progress
4208 Entity_Instance_ID: orchestration=kube-upgrade
4210 Proposed_Repair_Action: Wait for kubernetes upgrade auto-apply to complete; if problem persists contact next level of support
4213 Alarm_Type: equipment
4214 Probable_Cause: unspecified-reason
4215 Service_Affecting: True
4217 Management_Affecting_Severity: warning
4218 Degrade_Affecting_Severity: none
4223 Description: Kubernetes upgrade auto-apply aborting
4224 Entity_Instance_ID: orchestration=kube-upgrade
4226 Proposed_Repair_Action: Wait for kubernetes upgrade auto-apply abort to complete; if problem persists contact next level of support
4229 Alarm_Type: equipment
4230 Probable_Cause: unspecified-reason
4231 Service_Affecting: True
4233 Management_Affecting_Severity: warning
4234 Degrade_Affecting_Severity: none
4239 Description: Kubernetes upgrade auto-apply failed
4240 Entity_Instance_ID: orchestration=kube-upgrade
4242 Proposed_Repair_Action: Attempt to apply kubernetes upgrade manually; if problem persists contact next level of support
4245 Alarm_Type: equipment
4246 Probable_Cause: underlying-resource-unavailable
4247 Service_Affecting: True
4249 Management_Affecting_Severity: warning
4250 Degrade_Affecting_Severity: none
4255 Description: Kubernetes upgrade auto-apply start
4256 Entity_Instance_ID: orchestration=kube-upgrade
4258 Alarm_Type: equipment
4259 Probable_Cause: unspecified-reason
4260 Service_Affecting: False
4265 Description: Kubernetes upgrade auto-apply in progress
4266 Entity_Instance_ID: orchestration=kube-upgrade
4268 Alarm_Type: equipment
4269 Probable_Cause: unspecified-reason
4270 Service_Affecting: False
4275 Description: Kubernetes upgrade auto-apply rejected
4276 Entity_Instance_ID: orchestration=kube-upgrade
4278 Alarm_Type: equipment
4279 Probable_Cause: unspecified-reason
4280 Service_Affecting: False
4285 Description: Kubernetes upgrade auto-apply cancelled
4286 Entity_Instance_ID: orchestration=kube-upgrade
4288 Alarm_Type: equipment
4289 Probable_Cause: unspecified-reason
4290 Service_Affecting: False
4295 Description: Kubernetes upgrade auto-apply failed
4296 Entity_Instance_ID: orchestration=kube-upgrade
4298 Alarm_Type: equipment
4299 Probable_Cause: unspecified-reason
4300 Service_Affecting: False
4305 Description: Kubernetes upgrade auto-apply completed
4306 Entity_Instance_ID: orchestration=kube-upgrade
4308 Alarm_Type: equipment
4309 Probable_Cause: unspecified-reason
4310 Service_Affecting: False
4315 Description: Kubernetes upgrade auto-apply abort
4316 Entity_Instance_ID: orchestration=kube-upgrade
4318 Alarm_Type: equipment
4319 Probable_Cause: unspecified-reason
4320 Service_Affecting: False
4325 Description: Kubernetes upgrade auto-apply aborting
4326 Entity_Instance_ID: orchestration=kube-upgrade
4328 Alarm_Type: equipment
4329 Probable_Cause: unspecified-reason
4330 Service_Affecting: False
4335 Description: Kubernetes upgrade auto-apply abort rejected
4336 Entity_Instance_ID: orchestration=kube-upgrade
4338 Alarm_Type: equipment
4339 Probable_Cause: unspecified-reason
4340 Service_Affecting: False
4345 Description: Kubernetes upgrade auto-apply abort failed
4346 Entity_Instance_ID: orchestration=kube-upgrade
4348 Alarm_Type: equipment
4349 Probable_Cause: unspecified-reason
4350 Service_Affecting: False
4355 Description: Kubernetes upgrade auto-apply aborted
4356 Entity_Instance_ID: orchestration=kube-upgrade
4358 Alarm_Type: equipment
4359 Probable_Cause: unspecified-reason
4360 Service_Affecting: False
4365 Description: Kubernetes rootca update auto-apply in progress
4366 Entity_Instance_ID: orchestration=kube-rootca-update
4368 Proposed_Repair_Action: Wait for kubernetes rootca update auto-apply to complete; if problem persists contact next level of support
4371 Alarm_Type: equipment
4372 Probable_Cause: unspecified-reason
4373 Service_Affecting: True
4375 Management_Affecting_Severity: warning
4376 Degrade_Affecting_Severity: none
4381 Description: Kubernetes rootca update auto-apply aborting
4382 Entity_Instance_ID: orchestration=kube-rootca-update
4384 Proposed_Repair_Action: Wait for kubernetes rootca update auto-apply abort to complete; if problem persists contact next level of support
4387 Alarm_Type: equipment
4388 Probable_Cause: unspecified-reason
4389 Service_Affecting: True
4391 Management_Affecting_Severity: warning
4392 Degrade_Affecting_Severity: none
4397 Description: Kubernetes rootca update auto-apply failed. Command "sw-manager kube-rootca-update-strategy apply" failed.
4398 Entity_Instance_ID: orchestration=kube-rootca-update
4400 Proposed_Repair_Action: Attempt to apply kubernetes rootca update manually; if problem persists contact next level of support
4403 Alarm_Type: equipment
4404 Probable_Cause: underlying-resource-unavailable
4405 Service_Affecting: True
4407 Management_Affecting_Severity: warning
4408 Degrade_Affecting_Severity: none
4413 Description: Kubernetes rootca update auto-apply start
4414 Entity_Instance_ID: orchestration=kube-rootca-update
4416 Alarm_Type: equipment
4417 Probable_Cause: unspecified-reason
4418 Service_Affecting: False
4423 Description: Kubernetes rootca update auto-apply in progress
4424 Entity_Instance_ID: orchestration=kube-rootca-update
4426 Alarm_Type: equipment
4427 Probable_Cause: unspecified-reason
4428 Service_Affecting: False
4433 Description: Kubernetes rootca update auto-apply rejected
4434 Entity_Instance_ID: orchestration=kube-rootca-update
4436 Alarm_Type: equipment
4437 Probable_Cause: unspecified-reason
4438 Service_Affecting: False
4443 Description: Kubernetes rootca update auto-apply cancelled
4444 Entity_Instance_ID: orchestration=kube-rootca-update
4446 Alarm_Type: equipment
4447 Probable_Cause: unspecified-reason
4448 Service_Affecting: False
4453 Description: Kubernetes rootca update auto-apply failed
4454 Entity_Instance_ID: orchestration=kube-rootca-update
4456 Alarm_Type: equipment
4457 Probable_Cause: unspecified-reason
4458 Service_Affecting: False
4463 Description: Kubernetes rootca update auto-apply completed
4464 Entity_Instance_ID: orchestration=kube-rootca-update
4466 Alarm_Type: equipment
4467 Probable_Cause: unspecified-reason
4468 Service_Affecting: False
4473 Description: Kubernetes rootca update auto-apply abort
4474 Entity_Instance_ID: orchestration=kube-rootca-update
4476 Alarm_Type: equipment
4477 Probable_Cause: unspecified-reason
4478 Service_Affecting: False
4483 Description: Kubernetes rootca update auto-apply aborting
4484 Entity_Instance_ID: orchestration=kube-rootca-update
4486 Alarm_Type: equipment
4487 Probable_Cause: unspecified-reason
4488 Service_Affecting: False
4493 Description: Kubernetes rootca update auto-apply abort rejected
4494 Entity_Instance_ID: orchestration=kube-rootca-update
4496 Alarm_Type: equipment
4497 Probable_Cause: unspecified-reason
4498 Service_Affecting: False
4503 Description: Kubernetes rootca update auto-apply abort failed
4504 Entity_Instance_ID: orchestration=kube-rootca-update
4506 Alarm_Type: equipment
4507 Probable_Cause: unspecified-reason
4508 Service_Affecting: False
4513 Description: Kubernetes rootca update auto-apply aborted
4514 Entity_Instance_ID: orchestration=kube-rootca-update
4516 Alarm_Type: equipment
4517 Probable_Cause: unspecified-reason
4518 Service_Affecting: False
4523 Description: System config update auto-apply in progress
4524 Entity_Instance_ID: orchestration=system-config-update
4526 Proposed_Repair_Action: Wait for system config update auto-apply to complete; if problem persists contact next level of support
4529 Alarm_Type: equipment
4530 Probable_Cause: unspecified-reason
4531 Service_Affecting: True
4533 Management_Affecting_Severity: warning
4534 Degrade_Affecting_Severity: none
4539 Description: System config update auto-apply aborting
4540 Entity_Instance_ID: orchestration=system-config-update
4542 Proposed_Repair_Action: Wait for system config update auto-apply abort to complete; if problem persists contact next level of support
4545 Alarm_Type: equipment
4546 Probable_Cause: unspecified-reason
4547 Service_Affecting: True
4549 Management_Affecting_Severity: warning
4550 Degrade_Affecting_Severity: none
4555 Description: System config update auto-apply failed. Command "sw-manager system-config-update-strategy apply" failed
4556 Entity_Instance_ID: orchestration=system-config-update
4558 Proposed_Repair_Action: Attempt to apply system config update manually; if problem persists contact next level of support
4561 Alarm_Type: equipment
4562 Probable_Cause: underlying-resource-unavailable
4563 Service_Affecting: True
4565 Management_Affecting_Severity: warning
4566 Degrade_Affecting_Severity: none
4571 Description: System config update auto-apply start
4572 Entity_Instance_ID: orchestration=system-config-update
4574 Alarm_Type: equipment
4575 Probable_Cause: unspecified-reason
4576 Service_Affecting: False
4581 Description: System config update auto-apply in progress
4582 Entity_Instance_ID: orchestration=system-config-update
4584 Alarm_Type: equipment
4585 Probable_Cause: unspecified-reason
4586 Service_Affecting: False
4591 Description: System config update auto-apply rejected
4592 Entity_Instance_ID: orchestration=system-config-update
4594 Alarm_Type: equipment
4595 Probable_Cause: unspecified-reason
4596 Service_Affecting: False
4601 Description: System config update auto-apply cancelled
4602 Entity_Instance_ID: orchestration=system-config-update
4604 Alarm_Type: equipment
4605 Probable_Cause: unspecified-reason
4606 Service_Affecting: False
4611 Description: System config update auto-apply failed
4612 Entity_Instance_ID: orchestration=system-config-update
4614 Alarm_Type: equipment
4615 Probable_Cause: unspecified-reason
4616 Service_Affecting: False
4621 Description: System config update auto-apply completed
4622 Entity_Instance_ID: orchestration=system-config-update
4624 Alarm_Type: equipment
4625 Probable_Cause: unspecified-reason
4626 Service_Affecting: False
4631 Description: System config update auto-apply abort
4632 Entity_Instance_ID: orchestration=system-config-update
4634 Alarm_Type: equipment
4635 Probable_Cause: unspecified-reason
4636 Service_Affecting: False
4641 Description: System config update auto-apply aborting
4642 Entity_Instance_ID: orchestration=system-config-update
4644 Alarm_Type: equipment
4645 Probable_Cause: unspecified-reason
4646 Service_Affecting: False
4651 Description: System config update auto-apply abort rejected
4652 Entity_Instance_ID: orchestration=system-config-update
4654 Alarm_Type: equipment
4655 Probable_Cause: unspecified-reason
4656 Service_Affecting: False
4661 Description: System config update auto-apply abort failed
4662 Entity_Instance_ID: orchestration=system-config-update
4664 Alarm_Type: equipment
4665 Probable_Cause: unspecified-reason
4666 Service_Affecting: False
4671 Description: System config update auto-apply aborted
4672 Entity_Instance_ID: orchestration=system-config-update
4674 Alarm_Type: equipment
4675 Probable_Cause: unspecified-reason
4676 Service_Affecting: False
4681 Description: Node <hostname> tainted.
4682 Entity_Instance_ID: host=<hostname>
4684 Proposed_Repair_Action: |-
4685 Execute 'kubectl taint nodes <hostname> services=disabled:NoExecute-'.
4686 If it fails, execute 'system host-lock <hostname>' followed by
4687 'system host-unlock <hostname>'.
4688 If the issue still persists, contact next level of support.
4689 Maintenance_Action: none
4691 Alarm_Type: operational-violation
4692 Probable_Cause: unknown
4693 Service_Affecting: True
4695 Management_Affecting_Severity: warning
4696 Degrade_Affecting_Severity: major