diff options
author | Andrew Gauld <ag1282@att.com> | 2017-08-22 13:33:45 +0000 |
---|---|---|
committer | Andrew Gauld <ag1282@att.com> | 2017-08-22 13:38:55 +0000 |
commit | 4e7e20ec06a7d861a2723a454f123ce562bbce73 (patch) | |
tree | 239fd340ff2a5aed066d965e29a9f55f12a2912a /scripts/cdap-init.sh | |
parent | c5da71b7b389a42e5171899815d4cb8081384fa2 (diff) |
Seed code for deploying DCAE
Change-Id: Ie1a2faf2dd4731ef12aeeed8ecc49f329e68385c
Issue-Id: DCAEGEN2-78
Signed-off-by: Andrew Gauld <ag1282@att.com>
Diffstat (limited to 'scripts/cdap-init.sh')
-rw-r--r-- | scripts/cdap-init.sh | 387 |
1 files changed, 387 insertions, 0 deletions
diff --git a/scripts/cdap-init.sh b/scripts/cdap-init.sh new file mode 100644 index 0000000..2484f53 --- /dev/null +++ b/scripts/cdap-init.sh @@ -0,0 +1,387 @@ +# ============LICENSE_START==================================================== +# org.onap.dcae +# ============================================================================= +# Copyright (c) 2017 AT&T Intellectual Property. All rights reserved. +# ============================================================================= +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============LICENSE_END====================================================== + +set -x +# +# get configuration +# +CODE_SOURCE=$1 +CODE_VERSION=$2 +CLUSTER_INDEX=$3 +CLUSTER_SIZE=$4 +CLUSTER_FQDNS=$5 +CLUSTER_LOCAL_IPS=$6 +CLUSTER_FLOATING_IPS=$7 +DATACENTER=$8 +REGISTERED_NAME=$9 +export JAVA_HOME=/usr/lib/jvm/default-java +md5sum /root/.sshkey/id_rsa | awk '{ print $1 }' >/root/.mysqlpw +chmod 400 /root/.mysqlpw +# +# enable outside apt repositories +# +wget -qO- http://public-repo-1.hortonworks.com/HDP/ubuntu16/2.x/updates/2.6.0.3/hdp.list >/etc/apt/sources.list.d/hdp.list +wget -qO- http://repository.cask.co/ubuntu/precise/amd64/cdap/4.1/cask.list >/etc/apt/sources.list.d/cask.list +wget -qO- http://repository.cask.co/ubuntu/precise/amd64/cdap/4.1/pubkey.gpg | apt-key add - +apt-key adv --recv-keys --keyserver keyserver.ubuntu.com B9733A7A07513CAD +apt-get update +# +# install software from apt repositories +# +apt-get install -y default-jdk hadoop-hdfs hadoop-mapreduce hive hbase libsnappy-dev liblzo2-dev hadooplzo spark-master spark-python zip unzip +usermod -a -G hadoop hive +if [ $CLUSTER_INDEX -lt 3 ] +then + apt-get install -y zookeeper-server + cat <<!EOF >>/etc/zookeeper/conf/zookeeper-env.sh +export JAVA_HOME=/usr/lib/jvm/default-java +export ZOOCFGDIR=/etc/zookeeper/conf +export ZOO_LOG_DIR=/var/log/zookeeper +export ZOOPIDFILE=/var/run/zookeeper/zookeeper_server.pid +!EOF + mkdir -p /var/lib/zookeeper + chown zookeeper:zookeeper /var/lib/zookeeper + cp /usr/hdp/current/zookeeper-server/etc/init.d/zookeeper-server /etc/init.d/. + update-rc.d zookeeper-server defaults + service zookeeper-server start +fi +if [ $CLUSTER_INDEX -eq 2 ] +then + debconf-set-selections <<! +mysql-server mysql-server/root_password password $(cat /root/.mysqlpw) +! + debconf-set-selections <<! +mysql-server mysql-server/root_password_again password $(cat /root/.mysqlpw) +! + apt-get install -y cdap cdap-cli cdap-gateway cdap-kafka cdap-master cdap-security cdap-ui mysql-server mysql-connector-java +set +x +echo + mysql_secure_installation --use-default +mysql_secure_installation --use-default --password=$(cat /root/.mysqlpw) +set -x + mysql_install_db + cp /usr/share/java/mysql-connector-java-*.jar /usr/hdp/current/hive-client/lib/. + mkdir -p /usr/lib/hive/logs + chown -R hive:hadoop /usr/lib/hive + chmod -R 755 /usr/lib/hive +fi +# +# make directories +# +mkdir -p /hadoop/hdfs/journalnode/cl /hadoop/hdfs/namenode /hadoop/hdfs/data /etc/hadoop/conf /hadoop/yarn/local /hadoop/yarn/log /usr/lib/hadoop/logs /usr/lib/hadoop-mapreduce/logs /usr/lib/hadoop-yarn/logs /usr/lib/hbase/logs /etc/cdap/conf +# +# set up config files +# +HDPVER=$(ls /usr/hdp | grep -v current) +echo -Dhdp.version=$HDPVER >/usr/hdp/current/spark-client/conf/java-opts +echo "export OPTS=\"\${OPTS} -Dhdp.version=$HDPVER\"" >>/etc/cdap/conf/cdap-env.sh +cat >/etc/profile.d/hadoop.sh <<'!EOF' +HADOOP_PREFIX=/usr/hdp/current/hadoop-client +HADOOP_YARN_HOME=/usr/hdp/current/hadoop-yarn-nodemanager +HADOOP_HOME=/usr/hdp/current/hadoop-client +HADOOP_COMMON_HOME=$HADOOP_HOME +HADOOP_CONF_DIR=/etc/hadoop/conf +HADOOP_HDFS_HOME=/usr/hdp/current/hadoop-hdfs-namenode +HADOOP_LIBEXEC_DIR=$HADOOP_HOME/libexec +YARN_LOG_DIR=/usr/lib/hadoop-yarn/logs +HADOOP_LOG_DIR=/usr/lib/hadoop/logs +JAVA_HOME=/usr/lib/jvm/default-java +JAVA=$JAVA_HOME/bin/java +PATH=$PATH:$HADOOP_HOME/bin +HBASE_LOG_DIR=/usr/lib/hbase/logs +HADOOP_MAPRED_LOG_DIR=/usr/lib/hadoop-mapreduce/logs +HBASE_CONF_DIR=/etc/hbase/conf +export HADOOP_PREFIX HADOOP_HOME HADOOP_COMMON_HOME HADOOP_CONF_DIR HADOOP_HDFS_HOME JAVA_HOME PATH HADOOP_LIBEXEC_DIR JAVA JARN_LOG_DIR HADOOP_LOG_DIR HBASE_LOG_DIR HADOOP_MAPRED_LOG_DIR HBASE_CONF_DIR +!EOF +chmod 755 /etc/profile.d/hadoop.sh +cat </etc/profile.d/hadoop.sh >>/etc/hadoop/conf/hadoop-env.sh +mv /root/.sshkey /var/lib/hadoop-hdfs/.ssh +cp /var/lib/hadoop-hdfs/.ssh/id_rsa.pub /var/lib/hadoop-hdfs/.ssh/authorized_keys +>/etc/hadoop/conf/dfs.exclude +>/etc/hadoop/conf/yarn.exclude +chown -R hdfs:hadoop /var/lib/hadoop-hdfs/.ssh /hadoop /usr/lib/hadoop +chown -R yarn:hadoop /usr/lib/hadoop-yarn /hadoop/yarn +chown -R mapred:hadoop /usr/lib/hadoop-mapreduce +chown -R hbase:hbase /usr/lib/hbase +chmod 700 /var/lib/hadoop-hdfs/.ssh +chmod 600 /var/lib/hadoop-hdfs/.ssh/* +sed -i -e '/maxClientCnxns/d' /etc/zookeeper/conf/zoo.cfg + +cat >/tmp/init.py <<!EOF +import os +with open('/root/.mysqlpw', 'r') as f: + mysqlpw = f.readline().strip() +myid=int('$CLUSTER_INDEX') +count=$CLUSTER_SIZE +fqdns='$CLUSTER_FQDNS'.split(',') +localips='$CLUSTER_LOCAL_IPS'.split(',') +floatingips='$CLUSTER_FLOATING_IPS'.split(',') +with open('/etc/hosts', 'a') as f: + f.write("\n") + for index in range(0, count): + hn=fqdns[index][0: fqdns[index].index('.')] + f.write("{ip} {fqdn} {hn}\n".format(ip=localips[index],hn=hn,fqdn=fqdns[index])) + +def pxc(f, m): + a = "<?xml version='1.0' encoding='UTF-8'?>\n<?xml-stylesheet type='text/xsl' href='configuration.xsl'?>\n<configuration>" + for n in m.keys(): + a = a + "\n <property>\n <name>{n}</name>\n <value>{v}</value>\n </property>".format(n=n,v=m[n]) + a = a + "\n</configuration>\n" + with open(f, 'w') as xml: + xml.write(a) +pxc('/etc/hadoop/conf/core-site.xml', { + 'fs.defaultFS':'hdfs://cl' + }) +pxc('/etc/hadoop/conf/hdfs-site.xml', { + 'dfs.namenode.datanode.registration.ip-hostname-check':'false', + 'dfs.namenode.name.dir':'/hadoop/hdfs/namenode', + 'dfs.hosts.exclude':'/etc/hadoop/conf/dfs.exclude', + 'dfs.datanode.data.dir':'/hadoop/hdfs/data', + 'dfs.journalnode.edits.dir':'/hadoop/hdfs/journalnode', + 'dfs.nameservices':'cl', + 'dfs.ha.namenodes.cl':'nn1,nn2', + 'dfs.namenode.rpc-address.cl.nn1':localips[0]+':8020', + 'dfs.namenode.rpc-address.cl.nn2':localips[1]+':8020', + 'dfs.namenode.http-address.cl.nn1':localips[0]+':50070', + 'dfs.namenode.http-address.cl.nn2':localips[1]+':50070', + 'dfs.namenode.shared.edits.dir':'qjournal://'+localips[0]+':8485;'+localips[1]+':8485;'+localips[2]+':8485/cl', + 'dfs.journalnode.edits.dir':'/hadoop/hdfs/journalnode', + 'dfs.client.failover.proxy.provider.cl':'org.apache.hadoop.hdfs.server.namenode.ha.ConfiguredFailoverProxyProvider', + 'dfs.ha.fencing.methods':'sshfence(hdfs),shell(/bin/true)', + 'dfs.ha.fencing.ssh.private-key-files':'/var/lib/hadoop-hdfs/.ssh/id_rsa', + 'dfs.ha.fencing.ssh.connect-timeout':'30000', + 'dfs.ha.automatic-failover.enabled':'true', + 'ha.zookeeper.quorum':localips[0]+':2181,'+localips[1]+':2181,'+localips[2]+':2181' + }) +pxc('/etc/hadoop/conf/yarn-site.xml', { + 'yarn.nodemanager.vmem-check-enabled':'false', + 'yarn.application.classpath':'/etc/hadoop/conf,/usr/hdp/current/hadoop-client/*,/usr/hdp/current/hadoop-client/lib/*,/usr/hdp/current/hadoop-hdfs-client/*,/usr/hdp/current/hadoop-hdfs-client/lib/*,/usr/hdp/current/hadoop-yarn-client/*,/usr/hdp/current/hadoop-yarn-client/lib/*', + 'yarn.nodemanager.delete.debug-delay-sec':'43200', + 'yarn.scheduler.minimum-allocation-mb':'512', + 'yarn.scheduler.maximum-allocation-mb':'8192', + 'yarn.nodemanager.local-dirs':'/hadoop/yarn/local', + 'yarn.nodemanager.log-dirs':'/hadoop/yarn/log', + 'yarn.resourcemanager.zk-address':localips[0]+':2181,'+localips[1]+':2181,'+localips[2]+':2181', + 'yarn.resourcemanager.ha.enabled':'true', + 'yarn.resourcemanager.ha.rm-ids':'rm1,rm2', + 'yarn.resourcemanager.hostname.rm1':localips[1], + 'yarn.resourcemanager.hostname.rm2':localips[2], + 'yarn.resourcemanager.cluster-id':'cl', + 'yarn.resourcemanager.recovery-enabled':'true', + 'yarn.resourcemanager.store.class':'org.apache.hadoop.yarn.server.resourcemanager.recovery.ZKRMStateStore', + 'yarn.resourcemanager.nodes.exclude-path':'/etc/hadoop/conf/yarn.exclude' + }) +pxc('/etc/hadoop/conf/mapred-site.xml', { + 'mapreduce.application.classpath':'/etc/hadoop/conf,/usr/lib/hadoop/lib/*,/usr/lib/hadoop/*,/usr/hdp/current/hadoop-hdfs-namenode/,/usr/hdp/current/hadoop-hdfs-namenode/lib/*,/usr/hdp/current/hadoop-hdfs-namenode/*,/usr/hdp/current/hadoop-yarn-nodemanager/lib/*,/usr/hdp/current/hadoop-yarn-nodemanager/*,/usr/hdp/current/hadoop-mapreduce-historyserver/lib/*,/usr/hdp/current/hadoop-mapreduce-historyserver/*', + 'mapreduce.jobhistory.intermediate-done-dir':'/mr-history/tmp', + 'mapreduce.jobhistory.done-dir':'/mr-history/done', + 'mapreduce.jobhistory.address':localips[1], + 'mapreduce.jobhistory.webapp.address':localips[1] + }) +pxc('/etc/hbase/conf/hbase-site.xml', { + 'hbase.zookeeper.quorum':localips[0]+':2181,'+localips[1]+':2181,'+localips[2]+':2181', + 'hbase.rootdir':'hdfs://cl/apps/hbase/data', + 'hbase.cluster.distributed':'true' + }) +pxc('/etc/hive/conf/hive-site.xml', { + 'fs.file.impl.disable.cache':'true', + 'fs.hdfs.impl.disable.cache':'true', + 'hadoop.clientside.fs.operations':'true', + 'hive.auto.convert.join.noconditionaltask.size':'1000000000', + 'hive.auto.convert.sortmerge.join.noconditionaltask':'true', + 'hive.auto.convert.sortmerge.join':'true', + 'hive.enforce.bucketing':'true', + 'hive.enforce.sorting':'true', + 'hive.mapjoin.bucket.cache.size':'10000', + 'hive.mapred.reduce.tasks.speculative.execution':'false', + 'hive.metastore.cache.pinobjtypes':'Table,Database,Type,FieldSchema,Order', + 'hive.metastore.client.socket.timeout':'60s', + 'hive.metastore.local':'true', + 'hive.metastore.uris':'thrift://' + fqdns[2] + ':9083', + 'hive.metastore.warehouse.dir':'/apps/hive/warehouse', + 'hive.optimize.bucketmapjoin.sortedmerge':'true', + 'hive.optimize.bucketmapjoin':'true', + 'hive.optimize.mapjoin.mapreduce':'true', + 'hive.optimize.reducededuplication.min.reducer':'1', + 'hive.security.authorization.manager':'org.apache.hadoop.hive.ql.security.authorization.DefaultHiveAuthorizationProvider', + 'hive.semantic.analyzer.factory.impl':'org.apache.hivealog.cli.HCatSemanticAnalyzerFactory', + 'javax.jdo.option.ConnectionDriverName':'com.mysql.jdbc.Driver', + 'javax.jdo.option.ConnectionPassword': mysqlpw, + 'javax.jdo.option.ConnectionURL':'jdbc:mysql://localhost:3306/metastore?createDatabaseIfNotExist=true', + 'javax.jdo.option.ConnectionUserName':'root' + }) +if myid == 2: + pxc('/etc/cdap/conf/cdap-site.xml', { + 'zookeeper.quorum':localips[0]+':2181,'+localips[1]+':2181,'+localips[2]+':2181/\${root.namespace}', + 'router.server.address':localips[2], + 'explore.enabled':'true', + 'enable.unrecoverable.reset':'true', + 'kafka.seed.brokers':localips[2] + ':9092', + 'app.program.jvm.opts':'-XX:MaxPermSize=128M \${twill.jvm.gc.opts} -Dhdp.version=$HDPVER -Dspark.yarn.am.extraJavaOptions=-Dhdp.version=$HDPVER' + }) +with open('/etc/hbase/conf/regionservers', 'w') as f: + for ip in localips: + f.write('{ip}\n'.format(ip=ip)) +with open('/etc/hbase/conf/hbase-env.sh', 'a') as f: + f.write("export HBASE_MANAGES_ZK=false\n") +with open('/etc/zookeeper/conf/zoo.cfg', 'a') as f: + f.write("server.1={L1}:2888:3888\nserver.2={L2}:2888:3888\nserver.3={L3}:2888:3888\nmaxClientCnxns=0\nautopurge.purgeInterval=6\n".format(L1=localips[0],L2=localips[1],L3=localips[2])) +with open('/etc/clustermembers', 'w') as f: + f.write("export me={me}\n".format(me=myid)) + for idx in range(len(localips)): + f.write("export n{i}={ip}\n".format(i=idx, ip=localips[idx])) + f.write("export N{i}={ip}\n".format(i=idx, ip=floatingips[idx])) +with open('/etc/hadoop/conf/slaves', 'w') as f: + for idx in range(len(localips)): + if idx != myid: + f.write("{x}\n".format(x=localips[idx])) +if myid < 3: + with open('/var/lib/zookeeper/myid', 'w') as f: + f.write("{id}".format(id=(myid + 1))) + os.system('service zookeeper-server restart') +for ip in localips: + os.system("su - hdfs -c \"ssh -o StrictHostKeyChecking=no -o NumberOfPasswordPrompts=0 {ip} echo Connectivity to {ip} verified\"".format(ip=ip)) +!EOF + +python /tmp/init.py + +. /etc/clustermembers +waitfor() { + while ( ! nc $1 $2 </dev/null ) + do + echo waiting for $1 port $2 + sleep 30 + done +} +# journal nodes are on port 8485 +if [ $me -lt 3 ] +then + su - hdfs -c '$HADOOP_HOME/sbin/hadoop-daemon.sh start journalnode' + waitfor $n0 8485 + waitfor $n1 8485 + waitfor $n2 8485 +fi +if [ $me -eq 0 -a "$setupdone" = "" ] +then + su - hdfs -c 'hdfs namenode -format -nonInteractive' + su - hdfs -c 'hdfs zkfc -formatZK' +fi +if [ $me -eq 1 -a "$setupdone" = "" ] +then + waitfor $n0 8020 + su - hdfs -c 'hdfs namenode -bootstrapStandby -nonInteractive' + su - yarn -c 'yarn resourcemanager -format-state-store' +fi +if [ $me -eq 0 -o $me -eq 1 ] +then + su - hdfs -c '$HADOOP_HOME/sbin/hadoop-daemon.sh start zkfc' + su - hdfs -c '$HADOOP_HOME/sbin/hadoop-daemon.sh start namenode' +fi +su - hdfs -c '$HADOOP_HOME/sbin/hadoop-daemon.sh start datanode' +if [ $me -eq 1 -o $me -eq 2 ] +then + su - yarn -c '/usr/hdp/current/hadoop-yarn-nodemanager/sbin/yarn-daemon.sh start resourcemanager' +fi +su - yarn -c '/usr/hdp/current/hadoop-yarn-nodemanager/sbin/yarn-daemon.sh start nodemanager' +waitfor $n0 8020 +waitfor $n1 8020 +su - hdfs -c 'hdfs dfsadmin -safemode wait' +if [ $me -eq 1 ] +then + if [ "$setupdone" = "" ] + then + su - hdfs -c 'hdfs dfs -mkdir -p /mr-history/tmp' + su - hdfs -c 'hdfs dfs -chmod -R 1777 /mr-history/tmp' + su - hdfs -c 'hdfs dfs -mkdir -p /mr-history/done' + su - hdfs -c 'hdfs dfs -chmod -R 1777 /mr-history/done' + su - hdfs -c 'hdfs dfs -chown -R mapred:hdfs /mr-history' + su - hdfs -c 'hdfs dfs -mkdir -p /app-logs' + su - hdfs -c 'hdfs dfs -chmod -R 1777 /app-logs' + su - hdfs -c 'hdfs dfs -chown yarn:hdfs /app-logs' + su - hdfs -c 'hdfs dfs -mkdir -p /apps/hbase/staging /apps/hbase/data' + su - hdfs -c 'hdfs dfs -chown hbase:hdfs /apps/hbase/staging /apps/hbase/data' + su - hdfs -c 'hdfs dfs -chmod 711 /apps/hbase/staging' + su - hdfs -c 'hdfs dfs -chmod 755 /apps/hbase/data' + su - hdfs -c 'hdfs dfs -chown hdfs:hdfs /apps/hbase' + su - hdfs -c 'hdfs dfs -mkdir -p /user/yarn' + su - hdfs -c 'hdfs dfs -chown yarn:yarn /user/yarn' + su - hdfs -c 'hdfs dfs -mkdir -p /cdap/tx.snapshot' + su - hdfs -c 'hdfs dfs -chown yarn:yarn /cdap /cdap/tx.snapshot' + su - hdfs -c 'hdfs dfs -mkdir -p /user/hive /apps/hive/warehouse /tmp/hive' + su - hdfs -c 'hdfs dfs -chown -R hive:hadoop /user/hive /apps/hive /tmp/hive' + su - hdfs -c 'hdfs dfs -chmod -R 775 /apps/hive' + su - hdfs -c 'hdfs dfs -chmod -R 777 /tmp/hive' + fi + su - mapred -c '/usr/hdp/current/hadoop-mapreduce-historyserver/sbin/mr-jobhistory-daemon.sh start historyserver' + su - hbase -c '/usr/hdp/current/hbase-master/bin/hbase-daemon.sh start master' +fi +while [ "" != "$( echo get /hbase/master | hbase zkcli 2>&1 | grep 'Node does not exist: /hbase/master')" ] +do + echo Waiting for hbase master to come up + sleep 30 +done +su - hbase -c '/usr/hdp/current/hbase-regionserver/bin/hbase-daemon.sh start regionserver' + +if [ $me -eq 2 ] +then + if [ "$setupdone" = "" ] + then + su - hive -c '/usr/hdp/current/hive-metastore/bin/schematool -initSchema -dbType mysql' + fi + su - hive -c 'nohup /usr/hdp/current/hive-metastore/bin/hive --service metastore >>/var/log/hive/hive.out 2>>/var/log/hive/hive.log </dev/null &' + (cd /bin; wget https://raw.githubusercontent.com/caskdata/cdap-monitoring-tools/develop/nagios/check_cdap/bin/check_cdap) + chmod 755 /bin/check_cdap + wget -qO- $CODE_SOURCE/${CODE_VERSION}-raw/cloud_init/instconsulagentub16.sh >/tmp/cinst.sh + bash /tmp/cinst.sh <<!EOF +{ + "bind_addr": "0.0.0.0", + "client_addr": "0.0.0.0", + "advertise_addr": "$n2", + "data_dir": "/opt/consul/data", + "datacenter": "$DATACENTER", + "http_api_response_headers": { + "Access-Control-Allow-Origin": "*" + }, + "rejoin_after_leave": true, + "server": false, + "ui": false, + "enable_syslog": true, + "log_level": "info", + "service": { + "id": "$REGISTERED_NAME", + "name": "$REGISTERED_NAME", + "address": "$N2", + "port": 11015, + "checks": [ + { + "script": "/bin/check_cdap", + "interval": "60s" + } + ] + } +} +!EOF + for i in $(cd /etc/init.d; echo *cdap*) + do + service $i start + done +fi + +if [ "$setupdone" = "" ] +then + echo setupdone=true >>/etc/clustermembers +fi |