共计 24981 个字符,预计需要花费 63 分钟才能阅读完成。
环境
p5-thhidam-datacle-green02
p5-thhidam-datacle-green01
p5-thhidam-datacle-green03
一、系统设置(所有主机)
1、操作系统环境
CentOS 7.5.1804,64 位操作系统,没有更新过
[root@localhost tools]# cat /etc/redhat-release
CentOS Linux release 7.5.1804 (Core)
2、关闭防火墙
systemctl stop firewalld.service #停止 firewall
systemctl disable firewalld.service
3、关闭 NetworkManager
systemctl stop NetworkManager
4、关闭 selinux
[root@p5-thhidam-datacle-green01 gpAdminLogs]# cat /etc/selinux/config
# This file controls the state of SELinux on the system.
# SELINUX= can take one of these three values:
# enforcing - SELinux security policy is enforced.
# permissive - SELinux prints warnings instead of enforcing.
# disabled - No SELinux policy is loaded.
SELINUX=disabled
# SELINUXTYPE= can take one of three two values:
# targeted - Targeted processes are protected,
# minimum - Modification of targeted policy. Only selected processes are protected.
# mls - Multi Level Security protection.
SELINUXTYPE=targeted
5、配置 /etc/sysctl.conf
[root@p5-thhidam-datacle-green02 ~]# grep -v "#" /etc/sysctl.conf
net.ipv4.ip_forward = 0
net.ipv4.conf.default.rp_filter = 1
net.ipv4.conf.default.accept_source_route = 0
kernel.core_uses_pid = 1
net.ipv4.tcp_syncookies = 1
kernel.msgmnb = 65536
kernel.msgmax = 65536
net.ipv4.conf.all.promote_secondaries = 1
net.ipv4.conf.default.promote_secondaries = 1
net.ipv6.neigh.default.gc_thresh3 = 4096
net.ipv4.neigh.default.gc_thresh3 = 4096
kernel.softlockup_panic = 1
kernel.sysrq = 1
net.ipv6.conf.all.disable_ipv6=0
net.ipv6.conf.default.disable_ipv6=0
net.ipv6.conf.lo.disable_ipv6=0
kernel.numa_balancing = 0
kernel.shmmax = 68719476736
kernel.printk = 5
net.ipv6.conf.all.disable_ipv6 = 1
net.ipv6.conf.default.disable_ipv6 = 1
net.ipv4.neigh.default.gc_stale_time=120
net.ipv4.conf.default.arp_announce = 2
net.ipv4.conf.all.arp_announce=2
net.ipv4.conf.lo.arp_announce=2
net.ipv4.icmp_echo_ignore_broadcasts = 1
net.ipv4.icmp_ignore_bogus_error_responses = 1
net.ipv4.ip_forward = 0
net.ipv4.conf.all.send_redirects = 0
net.ipv4.conf.default.send_redirects = 0
net.ipv4.conf.all.rp_filter = 1
net.ipv4.conf.default.rp_filter = 1
net.ipv4.conf.all.accept_source_route = 0
net.ipv4.conf.default.accept_source_route = 0
kernel.sysrq = 0
kernel.core_uses_pid = 1
net.ipv4.tcp_syncookies = 1
kernel.msgmnb = 65536
kernel.msgmax = 65536
kernel.shmmax = 68719476736
kernel.shmall = 4294967296
net.ipv4.tcp_max_tw_buckets = 6000
net.ipv4.tcp_sack = 1
net.ipv4.tcp_window_scaling = 1
net.ipv4.tcp_rmem = 4096 87380 4194304
net.ipv4.tcp_wmem = 4096 16384 4194304
net.core.wmem_default = 8388608
net.core.rmem_default = 8388608
net.core.rmem_max = 16777216
net.core.wmem_max = 16777216
net.core.netdev_max_backlog = 262144
net.ipv4.tcp_max_orphans = 3276800
net.ipv4.tcp_max_syn_backlog = 262144
net.ipv4.tcp_timestamps = 0
net.ipv4.tcp_synack_retries = 1
net.ipv4.tcp_syn_retries = 1
net.ipv4.tcp_tw_recycle = 1
net.ipv4.tcp_tw_reuse = 1
net.ipv4.tcp_mem = 94500000 915000000 927000000
net.ipv4.tcp_fin_timeout = 1
net.ipv4.tcp_keepalive_time = 1800
net.ipv4.tcp_keepalive_probes = 3
net.ipv4.tcp_keepalive_intvl = 15
net.ipv4.ip_local_port_range = 1024 65000
net.netfilter.nf_conntrack_max=655350
net.netfilter.nf_conntrack_tcp_timeout_established=1200
net.ipv4.conf.all.accept_redirects = 0
net.ipv4.conf.default.accept_redirects = 0
net.ipv4.conf.all.secure_redirects = 0
net.ipv4.conf.default.secure_redirects = 0
vm.max_map_count = 1000000
fs.nr_open = 10000000
fs.file-max = 11000000
net.ipv4.conf.all.arp_filter = 1 ############## 主要是这一条 ###################
6、配置 /etc/security/limits.conf
* soft nofile 65536
* hard nofile 65536
* soft nproc 131072
* hard nproc 131072
7、手动执行命令让参数生效,也可以重启系统
#sysctl -p
8、修改 /etc/hosts 文件,配置主机名与 IP 地址的映射
192.xxxx.x.x p5-thhidam-datacle-green01
192.xx.x.x p5-thhidam-datacle-green02
192.x.x.x p5-thhidam-datacle-green03
9、创建 gpadmin 用户
-- 每台服务器都做
groupadd -g 530 gpadmin
useradd -g 530 -u 530 -m -d /data/gpadmin -s /bin/bash gpadmin
chown -R gpadmin:gpadmin /data/gpadmin
echo "gpadmin" | passwd --stdin gpadmin
二、安装和分发
CentOS7.5 部署 Greenplum6.14 集群源码安装
1 联网安装必要的包(所有机器)
[root@p5-thhidam-datacle-green01~]# yum -y install rsync coreutils glib2 lrzsz sysstat e4fsprogs xfsprogs ntp readline-devel zlib zlib-devel openssl openssl-devel pam-devel libxml2-devel libxslt-devel python-devel tcl-devel gcc make smartmontools flex bison perl perl-devel perl-ExtUtils* OpenIPMI-tools openldap openldap-devel logrotate gcc-c++ python-py python-pip libdwarf-devel libzstd-devel
[root@p5-thhidam-datacle-green01~]# yum -y install bzip2-devel libevent-devel apr-devel curl-devel ed python-paramiko python-devel
[root@p5-thhidam-datacle-green01~]# pip3 install --upgrade pip
[root@p5-thhidam-datacle-green01~]# pip3 install lockfile paramiko setuptools epydoc psutil
[root@p5-thhidam-datacle-green01~]# pip3 install --upgrade setuptools
2 master 节点解压源码编译安装 Greenplum
通过浏览器访问下载 https://github.com/greenplum-…
或者:
wget https://github.com/greenplum-db/gpdb/releases/download/6.14.1/6.14.1-src-full.tar.gz
- 编译
[root@p5-thhidam-datacle-green01 gpdb-5.15.1]# ./configure --prefix=/data/gpadmin --with-gssapi --with-pgport=5432 --with-libedit-preferred --with-perl --with-python --with-openssl --with-pam --with-krb5 --with-ldap --with-libxml --enable-cassert --enable-debug --enable-testutils --enable-debugbreak --enable-depend --disable-orca
- make -j8
[root@p5-thhidam-datacle-green01 gpdb-5.15.1]# make -j8
make[2]: Leaving directory `/data/tools/gpdb-5.15.1/gpAux/extensions/gpcloud/bin/gpcheckcloud'
make[1]: Leaving directory `/data/tools/gpdb-5.15.1/gpAux/extensions'
make -C gpAux/gpperfmon all
gcc -o gpnetbenchClient gpnetbenchClient.o
make[2]: Leaving directory `/data/tools/gpdb-5.15.1/gpAux/platform/gpnetbench'
make[1]: Leaving directory `/data/tools/gpdb-5.15.1/gpAux/platform'
All of Greenplum Database successfully made. Ready to install.
- make install
[root@p5-thhidam-datacle-green01 gpdb-5.15.1]# make install
make -C gpAux/gpperfmon install
make[1]: Entering directory `/data/tools/gpdb-5.15.1/gpAux/gpperfmon'
make[2]: Leaving directory `/data/tools/gpdb-5.15.1/gpAux/platform/gpnetbench'
make[1]: Leaving directory `/data/tools/gpdb-5.15.1/gpAux/platform'
Greenplum Database installation complete.
若出现以上输出,则说明安装成功。
3. 分发文件
因为只在 master 上安装了 Greenplum,所以下面要将安装包批量发送到每个 slave 机器上,才能算是整个集群都安装了 Greenplum。
先在 master 主节点上创建 GP 的 tar 文件,其中 gpsql(/data/gpsql)是安装路径。
[root@p5-thhidam-datacle-green01 gpsql]# chown -R gpadmin:gpadmin /data/gpsql/
[root@p5-thhidam-datacle-green01 gpadmin]# gtar -cvf /data/gpadmin/gp.tar /data/gpsql
下面的操作都是为了连接所有节点,并将安装包发送到每个节点
在 master 主机上,以 gpadmin 用户身份创建以下文本文件,可在 gpadmin 目录下创建 conf 文件夹,用来存放这些建立互信所需的信息
-- master 主机需要做
su - gpadmin
mkdir /data/gpadmin/conf
source /data/gpadmin/greenplum_path.sh
ssh-keygen
ssh-copy-id -i p5-thhidam-datacle-green02
ssh-copy-id -i p5-thhidam-datacle-green03
gpssh-exkeys -f /data/gpadmin/conf/all_hosts
**** 记住要在 master 节点上分别 ssh 登录一下各个节点
ssh gpadmin@p5-thhidam-datacle-green02
ssh gpadmin@p5-thhidam-datacle-green03
-
编辑集群列表
[root@p5-thhidam-datacle-green01 conf]# vim /data/gpadmin/conf/all_hosts
p5-thhidam-datacle-green01
p5-thhidam-datacle-green02
p5-thhidam-datacle-green03
[root@p5-thhidam-datacle-green01 conf]# vim /data/gpadmin/conf/seg_hosts
p5-thhidam-datacle-green02
p5-thhidam-datacle-green03
安装目录下的 greenplum_path.sh 中保存了运行 Greenplum 的一些环境变量设置,包括 GPHOME、PYTHONHOME 等设置。
以 gpadmin 身份执行 source 命令使其生效,之后用 gpssh-exkeys 交换密钥
[gpadmin@p5-thhidam-datacle-green01 gpsql]$ gpssh-exkeys -f /data/gpadmin/conf/all_hosts
[STEP 1 of 5] create local ID and authorize on local host
[STEP 2 of 5] keyscan all hosts and update known_hosts file
[STEP 3 of 5] authorize current user on remote hosts
... send to p5-thhidam-datacle-green02
***
*** Enter password for p5-thhidam-datacle-green02:
... send to p5-thhidam-datacle-green03
[STEP 4 of 5] determine common authentication file content
[STEP 5 of 5] copy authentication files to all remote hosts
... finished key exchange with p5-thhidam-datacle-green02
... finished key exchange with p5-thhidam-datacle-green03
[INFO] completed successfully
通过 gpscp 命令将之前的压缩包分发到 conf/seg_hosts 文件中配置的 segment 节点
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpscp -f /data/gpadmin/conf/seg_hosts /data/gpadmin/gp.tar =:/data/gpadmin/
查看压缩包是否分发成功
[gpadmin@p5-thhidam-datacle-green02 ~]$ ll
total 96780
-rw-r--r--. 1 gpadmin gpadmin 99102720 Apr 26 15:18 gp.tar
[gpadmin@swd2 ~]$ ll
total 96780
-rw-r--r--. 1 gpadmin gpadmin 99102720 Apr 26 15:18 gp.tar
通过 gpssh 连接到各节点时,all_hosts 里有多少台机器就应该有多少条输出
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpssh -f /data/gpadmin/conf/all_hosts
=> pwd
[p5-thhidam-datacle-green01] /data/gpadmin
[p5-thhidam-datacle-green03] /data/gpadmin
[p5-thhidam-datacle-green02] /data/gpadmin
=>
解压之前的安装包
=> gtar -xvf gp.tar
最后创建数据库工作目录
=> pwd
[p5-thhidam-datacle-green01] /data/gpadmin
[p5-thhidam-datacle-green03] /data/gpadmin
[p5-thhidam-datacle-green02] /data/gpadmin
=> mkdir gpdata
[p5-thhidam-datacle-green01]
[p5-thhidam-datacle-green03]
[p5-thhidam-datacle-green02]
=> cd gpdata
[p5-thhidam-datacle-green01]
[p5-thhidam-datacle-green03]
[p5-thhidam-datacle-green02]
=> mkdir gpdatap1 gpdatap2 gpdatam1 gpdatam2 gpmaster
[p5-thhidam-datacle-green01]
[p5-thhidam-datacle-green03]
[p5-thhidam-datacle-green02]
=> ll
[p5-thhidam-datacle-green01] total 20
[p5-thhidam-datacle-green01] drwxrwxr-x 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatam1
[p5-thhidam-datacle-green01] drwxrwxr-x 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatam2
[p5-thhidam-datacle-green01] drwxrwxr-x 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatap1
[p5-thhidam-datacle-green01] drwxrwxr-x 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatap2
[p5-thhidam-datacle-green01] drwxrwxr-x 2 gpadmin gpadmin 4096 Apr 26 15:30 gpmaster
[p5-thhidam-datacle-green03] total 20
[p5-thhidam-datacle-green03] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatam1
[p5-thhidam-datacle-green03] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatam2
[p5-thhidam-datacle-green03] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatap1
[p5-thhidam-datacle-green03] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatap2
[p5-thhidam-datacle-green03] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpmaster
[p5-thhidam-datacle-green02] total 20
[p5-thhidam-datacle-green02] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatam1
[p5-thhidam-datacle-green02] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatam2
[p5-thhidam-datacle-green02] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatap1
[p5-thhidam-datacle-green02] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpdatap2
[p5-thhidam-datacle-green02] drwxrwxr-x. 2 gpadmin gpadmin 4096 Apr 26 15:30 gpmaster
=>exit
三、初始化和创建数据库
1 配置.bash_profile 环境变量(每台机器都要配置)
[gpadmin@p5-thhidam-datacle-green01 ~]$ vim .bash_profile
# .bash_profile
# Login environment for the gpadmin user; configure it on every host.

# Get the aliases and functions
# (the spaces inside [ ... ] are required; "[-f" is parsed as a command name)
if [ -f ~/.bashrc ]; then
  . ~/.bashrc
fi

# User specific environment and startup programs
PATH=$PATH:$HOME/.local/bin:$HOME/bin
export PATH

# Load the Greenplum environment variables shipped in the install directory.
source /data/gpadmin/greenplum_path.sh

# Master instance directory: MASTER_DIRECTORY from gpinitsystem_config
# (/data/gpadmin/gpdata/gpmaster) plus the gpseg-1 subdirectory.
export MASTER_DATA_DIRECTORY=/data/gpadmin/gpdata/gpmaster/gpseg-1
# Same port as MASTER_PORT in gpinitsystem_config.
export PGPORT=2346
export PGDATABASE=testDB
让环境变量生效
[gpadmin@p5-thhidam-datacle-green01 ~]$ . ~/.bash_profile
2 同步时钟
》在 gpadmin 下:
- 查看时钟:
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpssh -f /data/gpadmin/conf/all_hosts -v date
[WARN] Reference default values as $MASTER_DATA_DIRECTORY/gpssh.conf could not be found
Using delaybeforesend 0.05 and prompt_validation_timeout 1.0
[Reset ...]
[INFO] login p5-thhidam-datacle-green01
[INFO] login p5-thhidam-datacle-green03
[INFO] login p5-thhidam-datacle-green02
[p5-thhidam-datacle-green01] Fri Apr 26 15:51:13 CST 2019
[p5-thhidam-datacle-green03] Fri Apr 26 15:51:13 CST 2019
[p5-thhidam-datacle-green02] Fri Apr 26 15:51:16 CST 2019
[INFO] completed successfully
[Cleanup...]
- 同步(注意:ntpd 必须以 root 身份运行,下面以 gpadmin 执行的输出实际上是失败的,需要改用 root 在各节点上执行):
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpssh -f /data/gpadmin/conf/all_hosts -v ntpd
[WARN] Reference default values as $MASTER_DATA_DIRECTORY/gpssh.conf could not be found
Using delaybeforesend 0.05 and prompt_validation_timeout 1.0
[Reset ...]
[INFO] login p5-thhidam-datacle-green01
[INFO] login p5-thhidam-datacle-green02
[INFO] login p5-thhidam-datacle-green03
[p5-thhidam-datacle-green01] must be run as root, not uid 1001
[p5-thhidam-datacle-green02] must be run as root, not uid 1001
[p5-thhidam-datacle-green03] must be run as root, not uid 1001
[INFO] completed successfully
3 编写数据库启动参数文件
将安装目录下的 /data/gpsql/docs/cli_help/gpconfigs/gpinitsystem_config 文件复制到 /data/gpadmin/conf 目录下,然后编辑,保留如下参数即可:
#vi /data/gpadmin/conf/gpinitsystem_config
文件中添加如下参数:
ARRAY_NAME="Greenplum Data Platform"
# gpinitsystem parameters describing the cluster layout used in this guide.
# Prefix for instance data directory names (the master instance directory is gpseg-1).
SEG_PREFIX=gpseg
# First port assigned to primary segments on each host.
PORT_BASE=42000
# Primary segment data directories; this guide ends up with two primaries per host.
declare -a DATA_DIRECTORY=(/data/gpadmin/gpdata/gpdatap1 /data/gpadmin/gpdata/gpdatap2)
# Host name and data directory location of the master instance.
MASTER_HOSTNAME=p5-thhidam-datacle-green01
MASTER_DIRECTORY=/data/gpadmin/gpdata/gpmaster
# Master listener port; the same value is exported as PGPORT in .bash_profile.
MASTER_PORT=2346
TRUSTED_SHELL=/usr/bin/ssh
CHECK_POINT_SEGMENTS=8
ENCODING=UNICODE
#### Optional parameters for mirror segments
# First port assigned to mirror segments on each host.
MIRROR_PORT_BASE=53000
# Base values that show up in the replication_port column for primaries and mirrors.
REPLICATION_PORT_BASE=43000
MIRROR_REPLICATION_PORT_BASE=54000
# Mirror segment data directories, paired with the primary directories above.
declare -a MIRROR_DATA_DIRECTORY=(/data/gpadmin/gpdata/gpdatam1 /data/gpadmin/gpdata/gpdatam2)
# Host list file created earlier under conf/.
MACHINE_LIST_FILE=/data/gpadmin/conf/seg_hosts
4 初始化
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpinitsystem -c /data/gpadmin/conf/gpinitsystem_config -a
20190429:15:23:32:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, please wait...
/bin/mv: try to overwrite ?.data/gpadmin/conf/gpinitsystem_config?. overriding mode 0644 (rw-r--r--)?
.
.
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-The Master /data/gpadmin/gpdata/gpmaster/gpseg-1/pg_hba.conf post gpinitsystem
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-has been configured to allow all hosts within this new
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-array to intercommunicate. Any hosts external to this
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-new array must be explicitly added to this file
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Refer to the Greenplum Admin support guide which is
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-located in the /data/gpsql/docs directory
20190429:15:26:07:096604 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-----------------
正常的话,会出现
[gpadmin@p5-thhidam-datacle-green01 ~]$ psql -d postgres
psql (8.3.23)
Type "help" for help.
postgres=# select * from gp_segment_configuration ;
dbid | content | role | preferred_role | mode | status | port | hostname | address | replication_port
------+---------+------+----------------+------+--------+-------+----------+---------+------------------
1 | -1 | p | p | s | u | 2346 | p5-thhidam-datacle-green01 | p5-thhidam-datacle-green01 |
2 | 0 | p | p | s | u | 42000 | p5-thhidam-datacle-green01 | p5-thhidam-datacle-green01 | 43000
4 | 2 | p | p | s | u | 42000 | p5-thhidam-datacle-green02 | p5-thhidam-datacle-green02 | 43000
6 | 4 | p | p | s | u | 42000 | p5-thhidam-datacle-green03 | p5-thhidam-datacle-green03 | 43000
3 | 1 | p | p | s | u | 42001 | p5-thhidam-datacle-green01 | p5-thhidam-datacle-green01 | 43001
5 | 3 | p | p | s | u | 42001 | p5-thhidam-datacle-green02 | p5-thhidam-datacle-green02 | 43001
7 | 5 | p | p | s | u | 42001 | p5-thhidam-datacle-green03 | p5-thhidam-datacle-green03 | 43001
8 | 0 | m | m | s | u | 53000 | p5-thhidam-datacle-green02 | p5-thhidam-datacle-green02 | 54000
9 | 1 | m | m | s | u | 53001 | p5-thhidam-datacle-green02 | p5-thhidam-datacle-green02 | 54001
10 | 2 | m | m | s | u | 53000 | p5-thhidam-datacle-green03 | p5-thhidam-datacle-green03 | 54000
11 | 3 | m | m | s | u | 53001 | p5-thhidam-datacle-green03 | p5-thhidam-datacle-green03 | 54001
12 | 4 | m | m | s | u | 53000 | p5-thhidam-datacle-green01 | p5-thhidam-datacle-green01 | 54000
13 | 5 | m | m | s | u | 53001 | p5-thhidam-datacle-green01 | p5-thhidam-datacle-green01 | 54001
(13 rows)
搭建过程中遇到的问题,记录如下:
错误 1:
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpinitsystem -c /data/gpadmin/conf/gpinitsystem_config -a
20190426:16:24:59:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, please wait...
/bin/mv: try to overwrite ?.data/gpadmin/conf/gpinitsystem_config?. overriding mode 0644 (rw-r--r--)?
20190426:16:25:05:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Reading Greenplum configuration file /data/gpadmin/conf/gpinitsystem_config
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Locale has not been set in /data/gpadmin/conf/gpinitsystem_config, will set to default value
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Locale set to en_US.utf8
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-No DATABASE_NAME set, will exit following template1 updates
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-MASTER_MAX_CONNECT not set, will set to default value 250
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, Completed
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing multi-data checks, please wait...
..
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Configuring build for standard array
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing multi-data checks, Completed
20190426:16:25:06:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building primary segment instance array, please wait...
....
20190426:16:25:10:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building group mirror array type , please wait...
....
20190426:16:25:14:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking Master host
20190426:16:25:14:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking new segment hosts, please wait...
........
20190426:16:25:31:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking new segment hosts, Completed
20190426:16:25:31:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building the Master instance database, please wait...
20190426:16:25:46:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Starting the Master in admin mode
20190426:16:25:54:gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[FATAL]:-Unknown host swd2 Script Exiting!
20190426:16:25:54:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:-Script has left Greenplum Database in an incomplete state
20190426:16:25:54:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:-Run command /bin/bash /data/gpadmin/gpAdminLogs/backout_gpinitsystem_gpadmin_20190426_162459 to remove these changes
20190426:16:25:54:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Start Function BACKOUT_COMMAND
20190426:16:25:54:049694 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-End Function BACKOUT_COMMAND
解决方式:
检查各节点的主机名是否正确,发现 p5-thhidam-datacle-green03 的主机名写成了 swd2,将其修改后,再次初始化
错误 2:
[gpadmin@p5-thhidam-datacle-green01 gpmaster]$ gpinitsystem -c /data/gpadmin/conf/gpinitsystem_config -a
20190426:16:35:24:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, please wait...
/bin/mv: try to overwrite ?.data/gpadmin/conf/gpinitsystem_config?. overriding mode 0644 (rw-r--r--)? y
/bin/mv: cannot move ?.tmp/cluster_tmp_file.51899?.to ?.data/gpadmin/conf/gpinitsystem_config?. Permission denied
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Reading Greenplum configuration file /data/gpadmin/conf/gpinitsystem_config
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Locale has not been set in /data/gpadmin/conf/gpinitsystem_config, will set to default value
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Locale set to en_US.utf8
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-No DATABASE_NAME set, will exit following template1 updates
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-MASTER_MAX_CONNECT not set, will set to default value 250
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, Completed
20190426:16:35:26:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing multi-data checks, please wait...
..
20190426:16:35:27:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Configuring build for standard array
20190426:16:35:27:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing multi-data checks, Completed
20190426:16:35:27:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building primary segment instance array, please wait...
....
20190426:16:35:30:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building group mirror array type , please wait...
....
20190426:16:35:34:051899 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking Master host
20190426:16:35:34:gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[FATAL]:-Found indication of postmaster process on port 2346 on Master host Script Exiting!
解决方式:杀死占用端口 2346 的进程
先查询进程
[gpadmin@p5-thhidam-datacle-green01 ~]$ lsof -i:2346
COMMAND PID USER FD TYPE DEVICE SIZE/OFF NODE NAME
postgres 51235 gpadmin 3u IPv4 111661 0t0 TCP *:redstorm_join (LISTEN)
postgres 51235 gpadmin 4u IPv6 111662 0t0 TCP *:redstorm_join (LISTEN)
然后杀死进程
[gpadmin@p5-thhidam-datacle-green01 ~]$ kill -9 51235
错误 3:
[gpadmin@p5-thhidam-datacle-green01 ~]$ gpinitsystem -c /data/gpadmin/conf/gpinitsystem_config -a
20190426:16:41:38:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, please wait...
/bin/mv: try to overwrite ?.data/gpadmin/conf/gpinitsystem_config?. overriding mode 0644 (rw-r--r--)? y
/bin/mv: cannot move ?.tmp/cluster_tmp_file.52895?.to ?.data/gpadmin/conf/gpinitsystem_config?. Permission denied
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Reading Greenplum configuration file /data/gpadmin/conf/gpinitsystem_config
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Locale has not been set in /data/gpadmin/conf/gpinitsystem_config, will set to default value
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Locale set to en_US.utf8
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-No DATABASE_NAME set, will exit following template1 updates
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-MASTER_MAX_CONNECT not set, will set to default value 250
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking configuration parameters, Completed
20190426:16:41:40:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing multi-data checks, please wait...
..
20190426:16:41:41:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Configuring build for standard array
20190426:16:41:41:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing multi-data checks, Completed
20190426:16:41:41:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building primary segment instance array, please wait...
....
20190426:16:41:44:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Building group mirror array type , please wait...
....
20190426:16:41:48:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Checking Master host
20190426:16:41:48:052895 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:-Have lock file /tmp/.s.PGSQL.2346.lock but no process running on port 2346
20190426:16:41:48:gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[FATAL]:-Found indication of postmaster process on port 2346 on Master host Script Exiting!
解决方式:删除文件 /tmp/.s.PGSQL.2346.lock
错误 4:
20190429:14:58:52:095181 gpstart:p5-thhidam-datacle-green01:gpadmin-[WARNING]:-Segment instance startup failures reported
20190429:14:58:52:095181 gpstart:p5-thhidam-datacle-green01:gpadmin-[WARNING]:-Failed start 9 of 12 segment instances <<<<<<<<
20190429:14:58:52:095181 gpstart:p5-thhidam-datacle-green01:gpadmin-[WARNING]:-Review /data/gpadmin/gpAdminLogs/gpstart_20190429.log
20190429:14:58:52:095181 gpstart:p5-thhidam-datacle-green01:gpadmin-[INFO]:-----------------------------------------------------
20190429:14:58:52:095181 gpstart:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Commencing parallel segment instance shutdown, please wait...
...
20190429:14:58:57:095181 gpstart:p5-thhidam-datacle-green01:gpadmin-[ERROR]:-gpstart error: Do not have enough valid segments to start the array.
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:-Failed to start Greenplum instance; review gpstart output to
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:- determine why gpstart failed and reinitialize cluster after resolving
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:- issues. Not all initialization tasks have completed so the cluster
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:- should not be used.
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:-gpinitsystem will now try to stop the cluster
20190429:14:58:57:085332 gpinitsystem:p5-thhidam-datacle-green01:gpadmin-[WARN]:
20190429:14:58:58:095823 gpstop:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Starting gpstop with args: -a -l /data/gpadmin/gpAdminLogs -i -d /data/gpadmin/gpdata/gpmaster/gpseg-1
20190429:14:58:58:095823 gpstop:p5-thhidam-datacle-green01:gpadmin-[INFO]:-Gathering information and validating the environment...
20190429:14:58:58:095823 gpstop:p5-thhidam-datacle-green01:gpadmin-[ERROR]:-gpstop error: postmaster.pid file does not exist. is Greenplum instance already stopped?
错误 5:
[gpadmin@gpp5-thhidam-datacle-green01 ~]$ gpstart
20130815:22:28:28:003675
gpstart:gpmaster:gpadmin-[INFO]:-Starting gpstart with
args:
20130815:22:28:28:003675
gpstart:gpmaster:gpadmin-[INFO]:-Gathering information and
validating the environment...
20130815:22:28:28:003675
gpstart failed. (Reason='[Errno 2] No such file or directory:'/data/gpadmin/gpadata/gpmaster/gpseg-1/postgresql.conf'') exiting...
解决办法:
在 .bash_profile 文件中添加
export PATH
# NOTE(review): earlier steps source /data/gpadmin/greenplum_path.sh; confirm
# which install prefix applies on your hosts.
source /data/gpsql/greenplum_path.sh
# The master data directory lives under "gpdata"; the misspelled "gpadata" path
# is what triggers the "No such file or directory" failure of gpstart.
export MASTER_DATA_DIRECTORY=/data/gpadmin/gpdata/gpmaster/gpseg-1
export PGPORT=2346
export PGDATABASE=testDB
并让其生效:. ~/.bash_profile
注:一个常见的错误是有部分节点死活 start 不起来,log 中显示 gpdata 下某某文件夹不存在,事实上是该文件夹下初始化了错误的文件。尝试 vi /data/gpadmin/.gphostcache 看看缓存的 host 对不对,不对的话修改过来。因为如果在修改 network 文件之前执行过 gpssh-exkeys,可能会在 .gphostcache 文件中把旧主机名和 hostlist 配置中的名字形成对应关系,而 Greenplum 之后不会再修改这个文件,这样的话 gpdata 下就会初始化错误的节点数据,所以这里是个大坑。
参考链接:
https://www.linuxidc.com/Linu…
https://www.cnblogs.com/chou1…
https://www.linuxidc.com/Linu…
https://blog.csdn.net/seeyouc…
https://blog.csdn.net/weixin_…
https://blog.csdn.net/q936889…