随着公司发展,业务数据量不断增长,越来越多的公司开始利用大数据平台分析业务。但是大数据平台的构建比较复杂,如果完全手动安装,其实非常不方便(各组件及其版本都要相互对应)。有没有方便一点的安装方式呢?有。目前主流的大数据平台集成安装环境有 CDH 和 Ambari,本文主要介绍 CDH 的安装。
链接: https://pan.baidu.com/s/1kjgKuk5gKvSSBYWM4lCoKw 密码: wagf
119.101.166.253 172.27.55.96 sc01
119.98.60.170 172.27.177.58 sc02
119.98.64.72 172.27.177.56 sc03
119.98.65.245 172.27.177.57 sc04
119.92.227.70 172.27.177.55 sc05
systemctl stop firewalld
systemctl disable firewalld
iptables -F
从 1.txt 中提取第 2、3 列(内网 IP 和主机名),生成追加到 /etc/hosts 的 echo 命令:cat 1.txt |awk '{print "echo \""$2,$3,"\"",">>/etc/hosts"}'
[root@sc01 ~]# more 1.txt
119.101.166.253 172.27.55.96 sc01
119.98.60.170 172.27.177.58 sc02
119.98.64.72 172.27.177.56 sc03
119.98.65.245 172.27.177.57 sc04
119.92.227.70 172.27.177.55 sc05
[root@sc01 ~]# cat 1.txt |awk '{print "echo \""$2,$3,"\"",">>/etc/hosts"}'
echo "172.27.55.96 sc01 " >>/etc/hosts
echo "172.27.177.58 sc02 " >>/etc/hosts
echo "172.27.177.56 sc03 " >>/etc/hosts
echo "172.27.177.57 sc04 " >>/etc/hosts
echo "172.27.177.55 sc05 " >>/etc/hosts
sed -i 's/SELINUX=enforcing/SELINUX=disabled/' /etc/selinux/config
setenforce 0
echo '*/30 * * * * /usr/sbin/ntpdate cn.pool.ntp.org && hwclock -w && hwclock --systohc >/dev/null 2>&1' >>/var/spool/cron/root
mkdir /usr/java
ln -s /usr/local/jdk1.8 /usr/java/default
systemctl stop cloudera-scm-agent
systemctl start cloudera-scm-agent
mkdir -p /usr/share/java/
下载 MySQL 驱动包:https://dev.mysql.com/downloads/connector/j/
复制时需将驱动包重命名为 mysql-connector-java.jar,文件名不能带版本号
cp mysql-connector-java-5.1.47.jar /usr/share/java/mysql-connector-java.jar
mysql -uroot -pxxxx
Use UTF8 encoding for all custom databases. MySQL and MariaDB must use the MySQL utf8 encoding, not utf8mb4.
create database cmf DEFAULT CHARACTER SET utf8;
create database amon DEFAULT CHARACTER SET utf8;
create database hive DEFAULT CHARACTER SET utf8;
grant all on cmf.* TO 'cmf'@'%' IDENTIFIED BY '123Aa123';
grant all on hive.* TO 'hive'@'%' IDENTIFIED BY '123Aa123';
grant all on amon.* TO 'amon'@'%' IDENTIFIED BY '123Aa123';
flush privileges;
mkdir /opt/cloudera-manager
tar -xzvf cm6.3.1-redhat7.tar.gz -C /opt/cloudera-manager/
cd /opt/cloudera-manager/cm6.3.1/RPMS/x86_64
rpm -ivh cloudera-manager-daemons-6.3.1-1466458.el7.x86_64.rpm --nodeps --force
rpm -ivh cloudera-manager-server-6.3.1-1466458.el7.x86_64.rpm --nodeps --force
cd /opt/cloudera-manager/cm6.3.1/RPMS/x86_64
rpm -ivh cloudera-manager-daemons-6.3.1-1466458.el7.x86_64.rpm --nodeps --force
rpm -ivh cloudera-manager-agent-6.3.1-1466458.el7.x86_64.rpm --nodeps --force
sed -i "s/server_host=localhost/server_host=sc01/g" /etc/cloudera-scm-agent/config.ini
vi /etc/cloudera-scm-server/db.properties
com.cloudera.cmf.db.type=mysql
com.cloudera.cmf.db.host=sc01
com.cloudera.cmf.db.name=cmf
com.cloudera.cmf.db.user=cmf
com.cloudera.cmf.db.password=123Aa123
com.cloudera.cmf.db.setupType=EXTERNAL
yum install -y httpd
mkdir -p /var/www/html/cdh6_parcel
systemctl start httpd
访问地址:http://sc01/cdh6_parcel
systemctl start cloudera-scm-server
cd /var/log/cloudera-scm-server/
systemctl start cloudera-scm-agent
http://sc01:7180/cmf
账号密码:admin/admin
关闭透明大页(Transparent Huge Pages)(主节点和其他节点都要执行)
echo never > /sys/kernel/mm/transparent_hugepage/defrag
echo never > /sys/kernel/mm/transparent_hugepage/enabled
设置 swappiness(主节点和其他节点都要执行)
sysctl vm.swappiness=10
echo 'vm.swappiness=10'>> /etc/sysctl.conf
sudo -u hdfs hadoop fs -mkdir -p /home/spark_conf
sudo -u hdfs hadoop fs -put /opt/cloudera/parcels/CDH/etc/hive/conf.dist/hive-site.xml /home/spark_conf/
1、下面的错误主要是由 JDK 导致的。请按照前文给出的路径(/usr/java/default)安装 JDK,以避免出现下面的问题。
[root@sc01 cdh]# journalctl -xe
Sep 16 10:44:02 sc01 cm-server[20855]: | - a supported version of the Oracle JDK from the Oracle Java web |
Sep 16 10:44:02 sc01 cm-server[20855]: | site: |
Sep 16 10:44:02 sc01 cm-server[20855]: | > http://www.oracle.com/technetwork/java/javase/index.html < |
Sep 16 10:44:02 sc01 cm-server[20855]: | OR |
Sep 16 10:44:02 sc01 cm-server[20855]: | - a supported version of the OpenJDK from your OS vendor. Help for |
Sep 16 10:44:02 sc01 cm-server[20855]: | some OSes are available at: |
Sep 16 10:44:02 sc01 cm-server[20855]: | > http://openjdk.java.net/install/ < |
Sep 16 10:44:02 sc01 cm-server[20855]: | |
Sep 16 10:44:02 sc01 cm-server[20855]: | Cloudera Manager requires Oracle JDK or OpenJDK 1.8 or later. |
Sep 16 10:44:02 sc01 cm-server[20855]: | NOTE: Cloudera Manager will find the Oracle JDK when starting, |
Sep 16 10:44:02 sc01 cm-server[20855]: | regardless of whether you installed the JDK using a binary |
Sep 16 10:44:02 sc01 cm-server[20855]: | installer or the RPM-based installer. |
Sep 16 10:44:02 sc01 cm-server[20855]: +======================================================================+
Sep 16 10:44:02 sc01 systemd[1]: cloudera-scm-server.service: main process exited, code=exited, status=1/FAILURE
Sep 16 10:44:02 sc01 systemd[1]: Unit cloudera-scm-server.service entered failed state.
Sep 16 10:44:02 sc01 systemd[1]: cloudera-scm-server.service failed.
Sep 16 10:44:02 sc01 systemd[1]: cloudera-scm-server.service holdoff time over, scheduling restart.
Sep 16 10:44:02 sc01 systemd[1]: Stopped Cloudera CM Server Service.
-- Subject: Unit cloudera-scm-server.service has finished shutting down
-- Defined-By: systemd
-- Support: http://lists.freedesktop.org/mailman/listinfo/systemd-devel
--
-- Unit cloudera-scm-server.service has finished shutting down.
Sep 16 10:44:02 sc01 systemd[1]: start request repeated too quickly for cloudera-scm-server.service
Sep 16 10:44:02 sc01 systemd[1]: Failed to start Cloudera CM Server Service.
-- Subject: Unit cloudera-scm-server.service has failed
-- Defined-By: systemd
-- Support: http://lists.freedesktop.org/mailman/listinfo/systemd-devel
--
-- Unit cloudera-scm-server.service has failed.
--
-- The result is failed.
Sep 16 10:44:02 sc01 systemd[1]: Unit cloudera-scm-server.service entered failed state.
Sep 16 10:44:02 sc01 systemd[1]: cloudera-scm-server.service failed.
解决:删除 agent 目录下的 cm_guid 文件,并重启失败节点的 agent 服务即可恢复。
rm -rvf /var/lib/cloudera-scm-agent/cm_guid
service cloudera-scm-agent restart