I am following the bare-metal installation instructions on a single node, and the installation gets stuck at the hive2::install step.
I see the following error:
ERROR [2021-06-07 08:52:58,773] se.kth.karamel.backend.dag.DagNode: Failed 'hive2::install on 172.17.0.3' because '172.17.0.3: Command did not complete: mkdir -p /home/hopsworks/.karamel/install ; cd /home/hopsworks/.karamel/install; echo $$ > pid; echo '#!/bin/bash
set -eo pipefail
echo $(date '+%H:%M:%S'): 'hive2__install' >> order
cat > hive2__install.json <<-'END_OF_FILE'
{
"hopsmonitor": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"alertmanager": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"prometheus": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"node_exporter": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"ndb": {
"mysqld": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"ndbd": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"mgmd": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"NoOfReplicas": "1",
"DataMemory": "4096"
},
"flink": {
"yarn": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"historyserver": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"hopslog": {
"_filebeat-spark": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"_filebeat-jupyter": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"_filebeat-serving": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"_filebeat-beam": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"kagent": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"consul": {
"master": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"hops": {
"rm": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"ndb": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"nn": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"nm": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"dn": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"docker_registry": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"jhs": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"tls": {
"enabled": "false"
},
"rmappsecurity": {
"actor_class": "org.apache.hadoop.yarn.server.resourcemanager.security.DevHopsworksRMAppSecurityActions"
},
"yarn": {
"pcores-vcores-multiplier": "0.66",
"cgroups_strict_resource_usage": "false",
"detect-hardware-capabilities": "true",
"system-reserved-memory-mb": "4000"
}
},
"hops_airflow": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"sqoop": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"kzookeeper": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"epipe": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"elastic": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"opendistro_security": {
"logstash": {
"password": "6bbb058e_201",
"username": "logstash"
},
"epipe": {
"username": "epipe",
"password": "6bbb058e_201"
},
"admin": {
"username": "admin",
"password": "6bbb058e_201"
},
"audit": {
"enable_transport": "false",
"enable_rest": "true"
},
"jwt": {
"exp_ms": "1800000"
},
"kibana": {
"password": "6bbb058e_201",
"username": "kibana"
},
"elastic_exporter": {
"username": "elasticexporter",
"password": "6bbb058e_201"
}
}
},
"hadoop_spark": {
"historyserver": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"yarn": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"hive2": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"mysql_password": "6bbb058e_203"
},
"kkafka": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"tensorflow": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"conda": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"livy": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
}
},
"hopsworks": {
"default": {
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"private_ips_domainIds": {
"172.17.0.3": "0"
},
"hosts": {
"172.17.0.3": "172.17.0.3"
}
},
"application_certificate_validity_period": "6d",
"kagent_liveness": {
"threshold": "40s",
"enabled": "true"
},
"requests_verify": "false",
"featurestore_online": "true",
"admin": {
"password": "6bbb058e_201",
"user": "adminuser"
},
"encryption_password": "6bbb058e_001",
"master": {
"password": "6bbb058e_002"
},
"https": {
"port": "443"
}
},
"install": {
"kubernetes": "false",
"dir": "/srv/hops",
"cloud": "none"
},
"mysql": {
"password": "6bbb058e_202"
},
"alertmanager": {
"email": {
"to": "sre@logicalclocks.com",
"smtp_host": "mail.hello.com",
"from": "hopsworks@logicalclocks.com"
}
},
"prometheus": {
"retention_time": "8h"
},
"private_ips": [
"172.17.0.3"
],
"public_ips": [
"172.17.0.3"
],
"hosts": {
"172.17.0.3": "172.17.0.3"
},
"run_list": [
"hive2::install"
]
}
END_OF_FILE
echo "%password_hidden%" | sudo -S chef-solo -c /home/hopsworks/.karamel/install/solo.rb -j /home/hopsworks/.karamel/install/hive2__install.json 2>&1 | tee hive2__install.log
echo 'https://github.com/logicalclocks/hive-chef/tree/2.1/hive2::install' >> succeed_list
' > hive2__install.sh ; chmod +x hive2__install.sh ; ./hive2__install.sh
', DAG is stuck here :(
in the installation logs.
Any ideas?