After a failed attempt at migrating our HostedEngine to a new iSCSI storage 
domain, we're unable to restart the original HostedEngine.  

Please see below for some details, and let me know what more information I can 
provide.  "Lnxvirt07" was the Host used to attempt the migration.  Any help 
would be greatly appreciated.

Many thanks,
Devin

------
[root@lnxvirt01 ~]# tail -n 5 /var/log/ovirt-hosted-engine-ha/agent.log
MainThread::INFO::2023-11-01 
12:29:53,514::state_decorators::51::ovirt_hosted_engine_ha.agent.hosted_engine.HostedEngine::(check)
 Global maintenance detected
MainThread::INFO::2023-11-01 
12:29:54,151::ovf_store::117::ovirt_hosted_engine_ha.lib.ovf.ovf_store.OVFStore::(scan)
 Found OVF_STORE: imgUUID:05ef954f-d06d-401c-85ec-5992e2afbe7d, 
volUUID:d2860f1d-19cf-4084-8a7e-d97880c32431
MainThread::INFO::2023-11-01 
12:29:54,530::ovf_store::117::ovirt_hosted_engine_ha.lib.ovf.ovf_store.OVFStore::(scan)
 Found OVF_STORE: imgUUID:a375a35b-7a87-4df4-8d29-a5ba371fee85, 
volUUID:ef8b3dae-bcae-4d58-bea8-cf1a34872267
MainThread::ERROR::2023-11-01 
12:29:54,813::config_ovf::65::ovirt_hosted_engine_ha.agent.hosted_engine.HostedEngine.config.vm::(_get_vm_conf_content_from_ovf_store)
 Failed extracting VM OVF from the OVF_STORE volume, falling back to initial 
vm.conf
MainThread::INFO::2023-11-01 
12:29:54,843::hosted_engine::531::ovirt_hosted_engine_ha.agent.hosted_engine.HostedEngine::(_monitoring_loop)
 Current state GlobalMaintenance (score: 3400)

[root@lnxvirt01 ~]# hosted-engine --vm-start
Command VM.getStats with args {'vmID': 'e6370d8f-c083-4f28-83d0-a232d693e07a'} 
failed:
(code=1, message=Virtual machine does not exist: {'vmId': 
'e6370d8f-c083-4f28-83d0-a232d693e07a'})
Command VM.create with args {'vmID': 'e6370d8f-c083-4f28-83d0-a232d693e07a', 
'vmParams': {'vmId': 'e6370d8f-c083-4f28-83d0-a232d693e07a', 'memSize': 
'16384', 'display': 'vnc', 'vmName': 'HostedEngine', 'smp': '4', 'maxVCpus': 
'40', 'cpuType': 'Haswell-noTSX', 'emulatedMachine': 'pc', 'devices': 
[{'index': '2', 'iface': 'ide', 'address': {'controller': '0', 'target': '0', 
'unit': '0', 'bus': '1', 'type': 'drive'}, 'specParams': {}, 'readonly': 
'true', 'deviceId': 'b3e2f40a-e28d-493c-af50-c1193fb9dc97', 'path': '', 
'device': 'cdrom', 'shared': 'false', 'type': 'disk'}, {'index': '0', 'iface': 
'virtio', 'format': 'raw', 'poolID': '00000000-0000-0000-0000-000000000000', 
'volumeID': '6afa3b19-7a1a-4e5c-a681-eed756d316e9', 'imageID': 
'94628710-cf73-4589-bd84-e58f741a4d5f', 'specParams': {}, 'readonly': 'false', 
'domainID': '555ad71c-1a4e-42b3-af8c-db39d9b9df67', 'optional': 'false', 
'deviceId': '6afa3b19-7a1a-4e5c-a681-eed756d316e9', 'address': {'bus': '0x00', 
'slot': '0x06', 'domain': '0x0000', 'type': 'pci', 'function': '0x0'}, 
'device': 'disk', 'shared': 'exclusive', 'propagateErrors': 'off', 'type': 
'disk', 'bootOrder': '1'}, {'device': 'scsi', 'model': 'virtio-scsi', 'type': 
'controller'}, {'nicModel': 'pv', 'macAddr': '00:16:3e:3b:3f:14', 'linkActive': 
'true', 'network': 'ovirtmgmt', 'specParams': {}, 'deviceId': 
'002afd06-9649-4ac5-a5e8-1a4945c3c136', 'address': {'bus': '0x00', 'slot': 
'0x03', 'domain': '0x0000', 'type': 'pci', 'function': '0x0'}, 'device': 
'bridge', 'type': 'interface'}, {'device': 'console', 'type': 'console'}, 
{'device': 'vga', 'alias': 'video0', 'type': 'video'}, {'device': 'vnc', 
'type': 'graphics'}, {'device': 'virtio', 'specParams': {'source': 'urandom'}, 
'model': 'virtio', 'type': 'rng'}]}} failed:
(code=100, message=General Exception: ("'xml'",))
VM failed to launch

[root@lnxvirt01 ~]# cat /etc/ovirt-hosted-engine/hosted-engine.conf 
fqdn=lnxvirt-engine.classe.cornell.edu
vm_disk_id=94628710-cf73-4589-bd84-e58f741a4d5f
vm_disk_vol_id=6afa3b19-7a1a-4e5c-a681-eed756d316e9
vmid=e6370d8f-c083-4f28-83d0-a232d693e07a
storage=192.168.56.50,192.168.56.51,192.168.56.52,192.168.56.53
nfs_version=
mnt_options=
conf=/var/run/ovirt-hosted-engine-ha/vm.conf
host_id=8
console=vnc
domainType=iscsi
spUUID=00000000-0000-0000-0000-000000000000
sdUUID=555ad71c-1a4e-42b3-af8c-db39d9b9df67
connectionUUID=e29cf818-5ee5-46e1-85c1-8aeefa33e95d
vdsm_use_ssl=true
gateway=192.168.55.1
bridge=ovirtmgmt
network_test=dns
tcp_t_address=
tcp_t_port=
metadata_volume_UUID=2bf987a2-ab81-454c-9fc7-dc7ec8945fd9
metadata_image_UUID=35429b63-16ca-417a-b87a-d232463bf6a3
lockspace_volume_UUID=b0d09780-2047-433c-812d-10ba0beff788
lockspace_image_UUID=8ccb878d-9938-43c8-908b-e1b416fe991c
conf_volume_UUID=0b40ac60-499e-4ff1-83d0-fc578f1af3dc
conf_image_UUID=551d4fe5-a9f7-4ba1-9951-87418362b434
# The following are used only for iSCSI storage
iqn=iqn.2002-10.com.infortrend:raid.uid58207.001
portal=1
user=
password=
port=3260,3260,3260,3260

[root@lnxvirt01 ~]# hosted-engine --vm-status
!! Cluster is in GLOBAL MAINTENANCE mode !!
--== Host lnxvirt06.classe.cornell.edu (id: 1) status ==--
Host ID                            : 1
Host timestamp                     : 3718817
Score                              : 3400
Engine status                      : {"vm": "down", "health": "bad", "detail": 
"unknown", "reason": "vm not running on this host"}
Hostname                           : lnxvirt06.classe.cornell.edu
Local maintenance                  : False
stopped                            : False
crc32                              : 233a1425
conf_on_shared_storage             : True
local_conf_timestamp               : 3718818
Status up-to-date                  : True
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=3718817 (Wed Nov  1 12:26:35 2023)
host-id=1
score=3400
vm_conf_refresh_time=3718818 (Wed Nov  1 12:26:37 2023)
conf_on_shared_storage=True
maintenance=False
state=GlobalMaintenance
stopped=False
--== Host lnxvirt05.classe.cornell.edu (id: 2) status ==--
Host ID                            : 2
Host timestamp                     : 3719461
Score                              : 3400
Engine status                      : {"vm": "down", "health": "bad", "detail": 
"unknown", "reason": "vm not running on this host"}
Hostname                           : lnxvirt05.classe.cornell.edu
Local maintenance                  : False
stopped                            : False
crc32                              : b3c81abe
conf_on_shared_storage             : True
local_conf_timestamp               : 3719462
Status up-to-date                  : True
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=3719461 (Wed Nov  1 12:26:41 2023)
host-id=2
score=3400
vm_conf_refresh_time=3719462 (Wed Nov  1 12:26:42 2023)
conf_on_shared_storage=True
maintenance=False
state=GlobalMaintenance
stopped=False
--== Host lnxvirt04.classe.cornell.edu (id: 3) status ==--
Host ID                            : 3
Host timestamp                     : 3718684
Score                              : 3400
Engine status                      : {"vm": "down", "health": "bad", "detail": 
"unknown", "reason": "vm not running on this host"}
Hostname                           : lnxvirt04.classe.cornell.edu
Local maintenance                  : False
stopped                            : False
crc32                              : 03a57b14
conf_on_shared_storage             : True
local_conf_timestamp               : 3718686
Status up-to-date                  : True
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=3718684 (Wed Nov  1 12:26:41 2023)
host-id=3
score=3400
vm_conf_refresh_time=3718686 (Wed Nov  1 12:26:43 2023)
conf_on_shared_storage=True
maintenance=False
state=GlobalMaintenance
stopped=False
--== Host lnxvirt03.classe.cornell.edu (id: 4) status ==--
Host ID                            : 4
Host timestamp                     : 3719430
Score                              : 3400
Engine status                      : {"vm": "down", "health": "bad", "detail": 
"unknown", "reason": "vm not running on this host"}
Hostname                           : lnxvirt03.classe.cornell.edu
Local maintenance                  : False
stopped                            : False
crc32                              : adb1aad2
conf_on_shared_storage             : True
local_conf_timestamp               : 3719432
Status up-to-date                  : True
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=3719430 (Wed Nov  1 12:26:35 2023)
host-id=4
score=3400
vm_conf_refresh_time=3719432 (Wed Nov  1 12:26:36 2023)
conf_on_shared_storage=True
maintenance=False
state=GlobalMaintenance
stopped=False
--== Host lnxvirt02.classe.cornell.edu (id: 5) status ==--
Host ID                            : 5
Host timestamp                     : 3719408
Score                              : 3400
Engine status                      : {"vm": "down", "health": "bad", "detail": 
"unknown", "reason": "vm not running on this host"}
Hostname                           : lnxvirt02.classe.cornell.edu
Local maintenance                  : False
stopped                            : False
crc32                              : 1996a067
conf_on_shared_storage             : True
local_conf_timestamp               : 3719410
Status up-to-date                  : True
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=3719408 (Wed Nov  1 12:26:39 2023)
host-id=5
score=3400
vm_conf_refresh_time=3719410 (Wed Nov  1 12:26:41 2023)
conf_on_shared_storage=True
maintenance=False
state=GlobalMaintenance
stopped=False
--== Host lnxvirt07.classe.cornell.edu (id: 7) status ==--
Host ID                            : 7
Host timestamp                     : 495392
Score                              : 0
Engine status                      : unknown stale-data
Hostname                           : lnxvirt07.classe.cornell.edu
Local maintenance                  : False
stopped                            : True
crc32                              : 2572e907
conf_on_shared_storage             : True
local_conf_timestamp               : 495352
Status up-to-date                  : False
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=495392 (Tue Oct 31 10:20:12 2023)
host-id=7
score=0
vm_conf_refresh_time=495352 (Tue Oct 31 10:19:33 2023)
conf_on_shared_storage=True
maintenance=False
state=AgentStopped
stopped=True
--== Host lnxvirt01.classe.cornell.edu (id: 8) status ==--
Host ID                            : 8
Host timestamp                     : 1729103
Score                              : 3400
Engine status                      : {"vm": "down", "health": "bad", "detail": 
"unknown", "reason": "vm not running on this host"}
Hostname                           : lnxvirt01.classe.cornell.edu
Local maintenance                  : False
stopped                            : False
crc32                              : 2e57e99d
conf_on_shared_storage             : True
local_conf_timestamp               : 1729104
Status up-to-date                  : True
Extra metadata (valid at timestamp):
metadata_parse_version=1
metadata_feature_version=1
timestamp=1729103 (Wed Nov  1 12:26:31 2023)
host-id=8
score=3400
vm_conf_refresh_time=1729104 (Wed Nov  1 12:26:33 2023)
conf_on_shared_storage=True
maintenance=False
state=GlobalMaintenance
stopped=False
!! Cluster is in GLOBAL MAINTENANCE mode !!

_______________________________________________
Users mailing list -- users@ovirt.org
To unsubscribe send an email to users-le...@ovirt.org
Privacy Statement: https://www.ovirt.org/privacy-policy.html
oVirt Code of Conduct: 
https://www.ovirt.org/community/about/community-guidelines/
List Archives: 
https://lists.ovirt.org/archives/list/users@ovirt.org/message/MAFELYQTNEWFISW4A2IE2P5PD4B7ZZC6/

Reply via email to