Root cause: The script expects that something sets up passwordless root login to the same node. The stage fails with "Host key verification failed." message due to empty /root/.ssh/known_hosts
file.
cluster:
type: single # single/ees/ecs
node_list:
- eosnode-1
eosnode-1:
hostname: smc19-m10
is_primary: true
network:
mgmt_if: eno1 # Management network interfaces for bonding
data_if: bond0 # Management network interfaces for bonding
gateway_ip: # No Implementation
storage:
metadata_device: # Device for /var/mero and possibly SWAP
- /dev/mapper/mpathn
data_devices: # Data device/LUN from storage enclosure
- /dev/mapper/mpatho
- /dev/mapper/mpathb
- /dev/mapper/mpathc
- /dev/mapper/mpathd
- /dev/mapper/mpathe
- /dev/mapper/mpathf
- /dev/mapper/mpathg
storage_enclosure:
id: storage_node_1 # equivalent to fqdn for server node
type: 5U84 # Type of enclosure. E.g. 5U84/PODS
controller:
type: gallium # Type of controller on storage node. E.g. gallium/indium/sati
primary_mc:
ip: 127.0.0.1
port: 8090
secondary_mc:
ip: 127.0.0.1
port: 8090
user: user
password: 'passwd'
520406@smc19-m10:~> facter --json hostname fqdn processorcount memorysize_mb ipaddress_bond0
{
"hostname": "smc19-m10",
"fqdn": "smc19-m10.mero.colo.seagate.com",
"processorcount": 48,
"memorysize_mb": "191890.84",
"ipaddress_bond0": "172.16.0.105"
}
[root@smc19-m10 .ssh]# stat /root/.ssh/known_hosts
File: ‘/root/.ssh/known_hosts’
Size: 0 Blocks: 0 IO Block: 4096 regular empty file
Device: fd00h/64768d Inode: 269550664 Links: 1
Access: (0644/-rw-r--r--) Uid: ( 0/ root) Gid: ( 0/ root)
Access: 2020-02-13 12:56:50.020410854 +0000
Modify: 2020-02-13 06:37:15.000000000 +0000
Change: 2020-02-13 10:16:33.283170230 +0000
Birth: -
[root@smc19-m10 .ssh]# head -v -n 100 /root/.ssh/*
==> /root/.ssh/authorized_keys <==
ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQCg6WBK+qXSDIunMgCpxUgcTfMnSO/WLBi6UikIfvbCzcf0+8JkpT/4zbwX3tnT+6ayb6eY0Qo6MlP5qd2OQb4MxPRVDHW8F4o/WAV41+CLdojGPGFSuWyCUOg6GfCPz7n1nKJmuTQ6DpYddQR9s1kIPVjRXDXiAJ8a8FkhJqKOVYDXNMEJ01YNF9fLepWFj8aScw0HalvvvXVq4RNynEDOmqGmLOLzBDVw8XpbDPUNVUxMyUf97ObXRL9KgQIToNoTYte5liQ9jyk7qupRxzZQr3z/7wC80SUkbKvBtC4S0FmWIhvROwOwZVhcMFUT30KavACW0fRd9FOUOP+wxQVp1v5fQBiOoCnoYZbKRNZN/rQmcecIhdFZfTZnq2HFF0kpu17hVa2cMqSbvRstxVot+FpxAH9HaVUMDuOngRpxzLSCXzp8sxSRGAwG2dEKnL/zTk6NPv4ED3645X4zGRBfPpO7eFcd/qoRw5FKwyFZa3/zzE2hre12I+H0+LHCoTU= 714502@PUN-U714502L001
==> /root/.ssh/config <==
Host eosnode-1
HostName eosnode-1
User root
UserKnownHostsFile /dev/null
StrictHostKeyChecking no
IdentityFile /root/.ssh/id_rsa_prvsnr
IdentitiesOnly yes
Host eosnode-2
HostName eosnode-2
User root
UserKnownHostsFile /dev/null
StrictHostKeyChecking no
IdentityFile /root/.ssh/id_rsa_prvsnr
IdentitiesOnly yes
==> /root/.ssh/id_rsa_prvsnr <==
-----BEGIN OPENSSH PRIVATE KEY-----
b3BlbnNzaC1rZXktdjEAAAAABG5vbmUAAAAEbm9uZQAAAAAAAAABAAABlwAAAAdzc2gtcn
...
20+x/gO5FXISdjAAAAFjcxNDUwMkBQVU4tVTcxNDUwMkwwMDEBAgME
-----END OPENSSH PRIVATE KEY-----
==> /root/.ssh/id_rsa_prvsnr.pub <==
ssh-rsa AAAAB3NzaC1yc2EAAAADAQABAAABgQCg6WBK+qXSDIunMgCpxUgcTfMnSO/WLBi6UikIfvbCzcf0+8JkpT/4zbwX3tnT+6ayb6eY0Qo6MlP5qd2OQb4MxPRVDHW8F4o/WAV41+CLdojGPGFSuWyCUOg6GfCPz7n1nKJmuTQ6DpYddQR9s1kIPVjRXDXiAJ8a8FkhJqKOVYDXNMEJ01YNF9fLepWFj8aScw0HalvvvXVq4RNynEDOmqGmLOLzBDVw8XpbDPUNVUxMyUf97ObXRL9KgQIToNoTYte5liQ9jyk7qupRxzZQr3z/7wC80SUkbKvBtC4S0FmWIhvROwOwZVhcMFUT30KavACW0fRd9FOUOP+wxQVp1v5fQBiOoCnoYZbKRNZN/rQmcecIhdFZfTZnq2HFF0kpu17hVa2cMqSbvRstxVot+FpxAH9HaVUMDuOngRpxzLSCXzp8sxSRGAwG2dEKnL/zTk6NPv4ED3645X4zGRBfPpO7eFcd/qoRw5FKwyFZa3/zzE2hre12I+H0+LHCoTU= 714502@PUN-U714502L001
==> /root/.ssh/known_hosts <==
[root@smc19-m10 .ssh]#
$ sudo salt eosnode-1 state.apply components.hare
...
<successful stages>
...
----------
ID: Stage - Initialize Hare
Function: cmd.run
Name: __slot__:salt:setup_conf.conf_cmd('/opt/seagate/eos/hare/conf/setup.yaml', 'hare:init')
Result: False
Comment: Command "/opt/seagate/eos/hare/libexec/prov-init /var/lib/hare/cluster.yaml" run
Started: 13:07:53.058719
Duration: 367.186 ms
Changes:
----------
pid:
54630
retcode:
1
stderr:
?[1;33mWarning?[0m: Could not locate a cache base directory from the environment.
You can provide a cache base directory by pointing the $XDG_CACHE_HOME
environment variable to a directory with read and write permissions.
Host key verification failed.
Traceback (most recent call last):
File "/opt/seagate/eos/hare/bin/../bin/cfgen", line 1397, in <module>
main()
File "/opt/seagate/eos/hare/bin/../bin/cfgen", line 121, in main
enrich_cluster_desc(cluster_desc, opts.mock)
File "/opt/seagate/eos/hare/bin/../bin/cfgen", line 215, in enrich_cluster_desc
ipaddr_key(node['data_iface']))
File "/opt/seagate/eos/hare/bin/../bin/cfgen", line 294, in get_facts
return json.loads(run_command(hostname, 'facter', '--json', *args))
File "/opt/seagate/eos/hare/bin/../bin/cfgen", line 288, in run_command
timeout=15).decode()
File "/usr/lib64/python3.6/subprocess.py", line 356, in check_output
**kwargs).stdout
File "/usr/lib64/python3.6/subprocess.py", line 438, in run
output=stdout, stderr=stderr)
subprocess.CalledProcessError: Command '['ssh', 'smc19-m10', 'facter', '--json', 'hostname', 'fqdn', 'processorcount', 'memorysize_mb', 'ipaddress_bond0']' returned non-zero exit status 255.
stdout:
2020-02-13 13:07:53: Generating cluster configuration...
----------