@andy2015
2025-01-12T23:07:34.000000Z
字数 4248
阅读 92
大数据湖仓技术
集群机器规划
vim /etc/hosts
192.168.132.64 st.master.node2 sr.fe.node2 ds.master.node2 zk.service.node1
192.168.132.211 st.master.node1 sr.fe.node1 ds.worker.node1 ss.query.server zk.service.node2 ds.api.server flink.master.node1
192.168.132.212 st.worker.node1 sr.be.node1 ds.worker.node2 flink.worker.node1
192.168.132.213 st.worker.node2 sr.be.node2 ds.worker.node3 pgsql.db.node flink.worker.node2 flink.master.node2
192.168.132.214 st.worker.node3 sr.be.node3 ds.master.node1 zk.service.node3 ds.alert.server flink.worker.node3 flink.master.node3
1). 安装PostgreSQL
sudo yum update
sudo yum install postgresql-server postgresql-contrib
sudo postgresql-setup initdb
sudo systemctl start postgresql
#sudo systemctl restart postgresql
sudo systemctl enable postgresql
#验证
sudo -i -u postgres
psql
SELECT rolname,rolpassword FROM pg_authid;
ALTER USER postgres WITH PASSWORD 'BT@024';
CREATE DATABASE dolphinscheduler;
# 修改 {user} 和 {password} 为你希望的用户名和密码
#CREATE USER {user} PASSWORD {password};
ALTER DATABASE dolphinscheduler OWNER TO postgres;
#远程访问
find / -name postgresql.conf
vim postgresql.conf
listen_addresses = '*'
find / -name pg_hba.conf
vim pg_hba.conf
host all all 0.0.0.0/0 md5
sudo systemctl restart postgresql
2). 安装zookeeper
a. 下载安装包:https://www.apache.org/dyn/closer.lua/zookeeper/zookeeper-3.8.4/apache-zookeeper-3.8.4-bin.tar.gz
b. 解压并安装配置
tar -zxvf apache-zookeeper-3.8.4-bin.tar.gz
mv apache-zookeeper-3.8.4-bin /opt/zookeeper-3.8.4
cd zookeeper-3.8.4/conf/
mv zoo_sample.cfg zoo.cfg
vim zoo.cfg
server.1=zk.service.node1:2888:3888
server.2=zk.service.node2:2888:3888
server.3=zk.service.node3:2888:3888
c. 创建zk数据目录并创建myid文件,文件内容与zoo.cfg中server.x项中的x对应。
sudo mkdir -p /data/zookeeper
touch /data/zookeeper/myid
sudo chmod -R 775 /data/zookeeper
echo "1" >> /data/zookeeper/myid
cd /opt/zookeeper-3.8.4/bin
sh ./zkServer.sh start
3). Flink安装(可选,需要配置SSH免密登录)
a. Flink: https://nightlies.apache.org/flink/flink-docs-release-1.20/zh/docs/deployment/resource-providers/standalone/overview/
b. Flink-CDC: https://nightlies.apache.org/flink/flink-cdc-docs-release-3.2/zh/docs/deployment/standalone/
c. Yarn集群:集群资源调度
https://www.cnblogs.com/caoweixiong/p/13451038.html
https://nightlies.apache.org/flink/flink-docs-release-1.20/zh/docs/deployment/resource-providers/yarn/
NFS配置参考
服务端:
sudo mkdir -p /data/flink/ha
sudo yum install nfs-utils rpcbind
sudo vi /etc/exports
/data/flink/ha *(rw,sync,no_root_squash)
/opt/flink *(rw,sync,no_root_squash)
sudo systemctl start rpcbind
sudo systemctl start nfs-server
sudo systemctl enable rpcbind
sudo systemctl enable nfs-server
客户端:
sudo yum install nfs-utils
sudo mkdir -p /data/flink/ha
sudo mount 192.168.132.211:/data/flink/ha /data/flink/ha
sudo mount 192.168.132.211:/data/flink/conf /data/flink/conf
sudo mount 192.168.132.211:/data/flink/lib /data/flink/lib
#取消挂载
sudo umount -lf /opt/flink
下载安装包
上传包到服务器各节点解压
tar -zxvf apache-dolphinscheduler-3.1.9-bin.tar.gz
配置用户免密及权限
useradd dsuser
echo "dsuser" | passwd --stdin dsuser
sed -i '$adsuser ALL=(ALL) NOPASSWD: ALL' /etc/sudoers
sed -i 's/Defaults requirett/#Defaults requirett/g' /etc/sudoers
chown -R dsuser:dsuser dolphinscheduler-3.1.9
#配置机器SSH免密登陆
su dsuser
ssh-keygen -t rsa -P '' -f ~/.ssh/id_rsa
cat ~/.ssh/id_rsa.pub >> ~/.ssh/authorized_keys
chmod 600 ~/.ssh/authorized_keys
ssh-copy-id dsuser@ip
#在数据库节点初始化数据库
bash tools/bin/upgrade-schema.sh
启动集群
# 一键停止集群所有服务
bash ./bin/stop-all.sh
# 一键开启集群所有服务
bash ./bin/start-all.sh
# 启停 Master
bash ./bin/dolphinscheduler-daemon.sh stop master-server
bash ./bin/dolphinscheduler-daemon.sh start master-server
# 启停 Worker
bash ./bin/dolphinscheduler-daemon.sh start worker-server
bash ./bin/dolphinscheduler-daemon.sh stop worker-server
# 启停 Api
bash ./bin/dolphinscheduler-daemon.sh start api-server
bash ./bin/dolphinscheduler-daemon.sh stop api-server
#启停 Alert
bash ./bin/dolphinscheduler-daemon.sh start alert-server
bash ./bin/dolphinscheduler-daemon.sh stop alert-server
浏览器访问地址 http://localhost:12345/dolphinscheduler/ui 即可登录系统 UI。默认的用户名和密码是 admin/dolphinscheduler123