-- root用户 【所有节点】
-- 添加如下参数:
cat>>/etc/sysctl.conf <<EOF
net.ipv4.tcp_fin_timeout=60
net.ipv4.tcp_retries1=5
net.ipv4.tcp_syn_retries=5
net.sctp.path_max_retrans=10
net.sctp.max_init_retransmits=10
EOF
-- 生效参数
sysctl -p
## 执行sysctl -p 时有如下报错,此处选择忽略
sysctl: cannot stat /proc/sys/net/sctp/path_max_retrans: No such file or directory
sysctl: cannot stat /proc/sys/net/sctp/max_init_retransmits: No such file or directory
# 预安装过程根据系统参数配置会有相应提示,请按照提示对应系统参数
1.2.3.2 关闭透明大页
-- root用户 【所有节点】
-- openGauss默认关闭使用transparent_hugepage服务,并将关闭命令写入操作系统启动文件
cat >> /etc/rc.d/rc.local<<EOF
if test -f /sys/kernel/mm/transparent_hugepage/enabled;
then
echo never > /sys/kernel/mm/transparent_hugepage/enabled
fi
if test -f /sys/kernel/mm/transparent_hugepage/defrag;
then
echo never > /sys/kernel/mm/transparent_hugepage/defrag
fi
EOF
-- 查看是否关闭:
cat /sys/kernel/mm/transparent_hugepage/enabled
cat /sys/kernel/mm/transparent_hugepage/defrag
# root 用户 节点一操作-- 设置lib库
export LD_LIBRARY_PATH=/opt/software/openGauss/script/gspylib/clib:$LD_LIBRARY_PATH
-- 执行预执行
python3 /opt/software/openGauss/script/gs_preinstall -U omm -G dbgrp -X /opt/software/openGauss/clusterconfig.xml
# 预执行过程中,从日志来看是拷贝了software目录下文件到其它节点,将节点一的scripts下ssh-agent.sh拷贝到其它节点/root/.ssh/目录下,执行完并将其删除,创建了omm用户,每个节点/etc/profile下设置环境变量
# 预执行详细执行过程可查看 /opt/gaussdb/log/omm/om 目录下的gs_preinstall日志文件 gs_preinstall_xxx.log
-- 预检查执行结果如下
Parsing the configuration file.
Successfully parsed the configuration file.
Installing the tools on the local node.
Successfully installed the tools on the local node.
Are you sure you want to create trust for root (yes/no)?yes -- 输入 yes
Please enter password for root
Password: 输入 root 口令
Successfully created SSH trust for the root permission user.
Setting host ip env
Successfully set host ip env.
Distributing package.
Begin to distribute package to tool path.
Successfully distribute package to tool path.
Begin to distribute package to package path.
Successfully distribute package to package path.
Successfully distributed package.
Are you sure you want to create the user[omm] and create trust for it (yes/no)? yes -- 输入 yes
Please enter password for cluster user.
Password: -- 设置 omm 口令
Please enter password for cluster user again.
Password: -- 再次输入 omm 口令
Generate cluster user password files successfully.
Successfully created [omm] user on all nodes.
Preparing SSH service.
Successfully prepared SSH service.
Installing the tools in the cluster.
Successfully installed the tools in the cluster.
Checking hostname mapping.
Successfully checked hostname mapping.
Creating SSH trust for [omm] user.
Please enter password for current user[omm].
Password: -- 输入 omm 口令
Checking network information.
All nodes in the network are Normal.
Successfully checked network information.
Creating SSH trust.
Creating the local key file.
Successfully created the local key files.
Appending local ID to authorized_keys.
Successfully appended local ID to authorized_keys.
Updating the known_hosts file.
Successfully updated the known_hosts file.
Appending authorized_key on the remote node.
Successfully appended authorized_key on all remote node.
Checking common authentication file content.
Successfully checked common authentication content.
Distributing SSH trust file to all node.
Distributing trust keys file to all node successfully.
Successfully distributed SSH trust file to all node.
Verifying SSH trust on all hosts.
Successfully verified SSH trust on all hosts.
Successfully created SSH trust.
Successfully created SSH trust for [omm] user.
Checking OS software.
Successfully check os software.
Checking OS version.
Successfully checked OS version.
Creating cluster's path.
Successfully created cluster's path.
Set and check OS parameter.
Setting OS parameters.
Successfully set OS parameters.
Warning: Installation environment contains some warning messages.
Please get more details by "/opt/software/openGauss/script/gs_checkos -i A -h opengauss-db1,opengauss-db2,opengauss-db3 --detail".
Set and check OS parameter completed.
Preparing CRON service.
Successfully prepared CRON service.
Setting user environmental variables.
Successfully set user environmental variables.
Setting the dynamic link library.
Successfully set the dynamic link library.
Setting Core file
Successfully set core path.
Setting pssh path
Successfully set pssh path.
Setting Cgroup.
Successfully set Cgroup.
Set ARM Optimization.
No need to set ARM Optimization.
Fixing server package owner.
Setting finish flag.
Successfully set finish flag.
Preinstallation succeeded.
-- 查看预安装结果信息,并根据预检查调整参数
[root@opengauss-db1 ~]# /opt/software/openGauss/script/gs_checkos -i A -h opengauss-db1,opengauss-db2,opengauss-db3 --detail
-- 执行结果如下
# 本次测试环境三台服务器,操作系统为 Centos 7.9, 系统内核为 3.10.0-693.el7.x86_64 曾经做过7.6系统的升级
Checking items:
A1. [ OSversionstatus ] : Normal
[opengauss-db3]
centos_7.9.2009_64bit
[opengauss-db2]
centos_7.9.2009_64bit
[opengauss-db1]
centos_7.9.2009_64bit
A2. [ Kernelversionstatus ] : Warning
[opengauss-db1]
3.10.0-957.27.2.el7.x86_64
[opengauss-db2]
3.10.0-1160.76.1.el7.x86_64
[opengauss-db3]
3.10.0-1160.76.1.el7.x86_64
A3. [ Unicodestatus ] : Normal
The values of all unicode are same. The value is "LANG=en_US.UTF-8".
A4. [ Timezonestatus ] : Normal
The informations about all timezones are same. The value is "+0800".
A5. [ Swapmemorystatus ] : Normal
The value about swap memory is correct.
A6. [ Systemcontrolparametersstatus ] : Warning
[opengauss-db1]
Warning reason: variable 'net.ipv4.ip_local_port_range' RealValue '1024 65000' ExpectedValue '26000 65535'.
Check_SysCtl_Parameter warning.
[opengauss-db2]
Warning reason: variable 'net.ipv4.ip_local_port_range' RealValue '1024 65000' ExpectedValue '26000 65535'.
Check_SysCtl_Parameter warning.
[opengauss-db3]
Warning reason: variable 'net.ipv4.ip_local_port_range' RealValue '1024 65000' ExpectedValue '26000 65535'.
Check_SysCtl_Parameter warning.
A7. [ Filesystemconfigurationstatus ] : Warning
[opengauss-db1]
Warning reason: variable 'open files' RealValue '65536' ExpectedValue '1000000'
Warning reason: variable 'max user processes' RealValue '69632' ExpectedValue 'unlimited'
[opengauss-db2]
Warning reason: variable 'open files' RealValue '65536' ExpectedValue '1000000'
Warning reason: variable 'max user processes' RealValue '69632' ExpectedValue 'unlimited'
[opengauss-db3]
Warning reason: variable 'open files' RealValue '65536' ExpectedValue '1000000'
Warning reason: variable 'max user processes' RealValue '69632' ExpectedValue 'unlimited'
A8. [ Diskconfigurationstatus ] : Normal
The value about XFS mount parameters is correct.
A9. [ Pre-readblocksizestatus ] : Normal
The value about Logical block size is correct.
A10.[ IOschedulerstatus ] : Normal
The value of IO scheduler is correct.
A11.[ Networkcardconfigurationstatus ] : Warning
[opengauss-db1]
BondMode Null
Warning reason: network 'ens33' 'mtu' RealValue '1500' ExpectedValue '8192' -- 可忽略
[opengauss-db2]
BondMode Null
Warning reason: network 'ens33' 'mtu' RealValue '1500' ExpectedValue '8192' -- 可忽略
[opengauss-db3]
BondMode Null
Warning reason: network 'ens33' 'mtu' RealValue '1500' ExpectedValue '8192' -- 可忽略
A12.[ Timeconsistencystatus ] : Warning
[opengauss-db1]
The NTPD not detected on machine and local time is "2022-11-09 11:53:23".
[opengauss-db2]
The NTPD not detected on machine and local time is "2022-11-09 11:53:23".
[opengauss-db3]
The NTPD not detected on machine and local time is "2022-11-09 11:53:24".
A13.[ Firewallservicestatus ] : Normal
The firewall service is stopped.
A14.[ THPservicestatus ] : Normal
The THP service is stopped.
Total numbers:14. Abnormal numbers:0. Warning numbers:5.
=============================================================================
-- 根据执行detail命令结果对预检查告警进行调整
-- 预检查过程中遇到的问题可参照 后文 附录 部分
-- 节点一切换到omm用户执行
su - omm
-- 执行如下命令
gs_install -X /opt/software/openGauss/clusterconfig.xml
# 执行过程可查看/opt/gaussdb/log/omm/om及各节点/opt/gaussdb/log/omm/pg_log/ 下日志文件#
[omm@opengauss-db1 ~]$ gs_install -X /opt/software/openGauss/clusterconfig.xml --gsinit-parameter="--encoding=UTF8"
-- 执行结果如下
Parsing the configuration file.
Check preinstall on every node.
Successfully checked preinstall on every node.
Creating the backup directory.
Successfully created the backup directory.
begin deploy..
Installing the cluster.
begin prepare Install Cluster..
Checking the installation environment on all nodes.
begin install Cluster..
Installing applications on all nodes.
Successfully installed APP.
begin init Instance..
encrypt cipher and rand files for database.
Please enter password for database: -- 设置数据库 口令 如 Passw0rd@1234
Please repeat for database: -- 再次输入相同口令
begin to create CA cert files
The sslcert will be generated in /opt/gaussdb/install/app/share/sslcert/om
Create CA files for cm beginning.
Create CA files on directory [/opt/gaussdb/install/app_4e931f9a/share/sslcert/cm]. file list: ['client.key.rand', 'server.crt', 'cacert.pem', 'client.crt', 'server.key.rand', 'client.key', 'client.key.cipher', 'server.key', 'server.key.cipher']
Cluster installation is completed.
Configuring.
Deleting instances from all nodes.
Successfully deleted instances from all nodes.
Checking node configuration on all nodes.
Initializing instances on all nodes.
Updating instance configuration on all nodes.
Check consistence of memCheck and coresCheck on database nodes.
Successful check consistence of memCheck and coresCheck on all nodes.
Configuring pg_hba on all nodes.
Configuration is completed.
Starting cluster.
======================================================================
Successfully started primary instance. Wait for standby instance.
======================================================================
.
Successfully started cluster.
======================================================================
cluster_state : Normal
redistributing : No
node_count : 3
Datanode State
primary : 1
standby : 2
secondary : 0
cascade_standby : 0
building : 0
abnormal : 0
down : 0
Successfully installed application.
end deploy..
3.5.3 数据库状态检查
-- omm用户
[omm@opengauss-db1 ~]$ gs_om -t status --detail
[ CMServer State ]
node node_ip instance state
------------------------------------------------------------------------------------
1    opengauss-db1 192.168.17.113  1    /opt/gaussdb/install/data/cm/cm_server Primary
2    opengauss-db2 192.168.17.139  2    /opt/gaussdb/install/data/cm/cm_server Standby
3    opengauss-db3 192.168.17.159  3    /opt/gaussdb/install/data/cm/cm_server Standby
[ Cluster State ]
cluster_state : Normal
redistributing : No
balanced : Yes
current_az : AZ_ALL
[ Datanode State ]
node node_ip instance state
-------------------------------------------------------------------------------------
1    opengauss-db1 192.168.17.113  6001 /opt/gaussdb/install/data/db1 P Primary Normal
2    opengauss-db2 192.168.17.139  6002 /opt/gaussdb/install/data/db1 S Standby Normal
3    opengauss-db3 192.168.17.159  6003 /opt/gaussdb/install/data/db1 S Standby Normal
3.5.4 集群状态检查
-- omm 用户
[omm@opengauss-db1 ~]$ cm_ctl query -Cv
[ CMServerState ]
node instance state
---------------------------------
1    opengauss-db1 1    Primary
2    opengauss-db2 2    Standby
3    opengauss-db3 3    Standby
[ ClusterState ]
cluster_state : Normal
redistributing : No
balanced : Yes
current_az : AZ_ALL
[ DatanodeState ]
node instance state | node instance state | node instance state
---------------------------------------------------------------------------------------------------------------------------------------
1    opengauss-db1 6001 P Primary Normal | 2    opengauss-db2 6002 S Standby Normal | 3    opengauss-db3 6003 S Standby Normal
四、集群测试
4.1 主备数据验证测试
-- omm用户
-- 主节点
[omm@opengauss-db1 ~]$ gsql -d postgres -p 26000
gsql ((openGauss 3.1.0 build 4e931f9a) compiled at 2022-09-29 14:19:24 commit 0 last mr  )
Non-SSL connection (SSL connection is recommended when requiring high-security)
Type "help" for help.
openGauss=# create table tb1 (id int, name text);
CREATE TABLE
openGauss=# insert into tb1 (id,name) values (10,'Jacky');
INSERT 0 1
openGauss=# commit;
WARNING:  there is no transaction in progress
COMMIT
openGauss=# \echo :AUTOCOMMIT   -- 默认开启了自动提交
on
openGauss=#
-- 备节点一
[omm@opengauss-db2 ~]$ gsql -d postgres -p 26000
gsql ((openGauss 3.1.0 build 4e931f9a) compiled at 2022-09-29 14:19:24 commit 0 last mr  )
Non-SSL connection (SSL connection is recommended when requiring high-security)
Type "help" for help.
openGauss=# select * from tb1;
 id | name
----+-------
 10 | Jacky
(1 row)
openGauss=# insert into tb1 (id,name) values (11,'shlei');
ERROR:  cannot execute INSERT in a read-only transaction
openGauss=#
-- 备节点二
[omm@opengauss-db3 ~]$ gsql -d postgres -p 26000
gsql ((openGauss 3.1.0 build 4e931f9a) compiled at 2022-09-29 14:19:24 commit 0 last mr  )
Non-SSL connection (SSL connection is recommended when requiring high-security)
Type "help" for help.
openGauss=# select * from tb1;
 id | name
----+-------
 10 | Jacky
(1 row)
openGauss=# insert into tb1 (id,name) values (11,'shlei');
ERROR:  cannot execute INSERT in a read-only transaction
openGauss=#
4.2 集群启停测试
4.2.1 停止集群
-- omm 用户
-- 停止集群
[omm@opengauss-db1 ~]$ cm_ctl stop
cm_ctl: stop cluster.
cm_ctl: stop nodeid: 1
cm_ctl: stop nodeid: 2
cm_ctl: stop nodeid: 3
..........
cm_ctl: stop cluster successfully.
-- 查看集群状态
[omm@opengauss-db1 ~]$ cm_ctl query -Cv
[ CMServerState ]
node instance state
---------------------------------
1    opengauss-db1 1    Down
2    opengauss-db2 2    Down
3    opengauss-db3 3    Down
cm_ctl: can't connect to cm_server.
Maybe cm_server is not running, or timeout expired. Please try again.
4.2.2 启动集群
-- omm 用户
-- 启动集群
[omm@opengauss-db1 ~]$ cm_ctl start
cm_ctl: checking cluster status.
cm_ctl: checking cluster status.
cm_ctl: checking finished in 901 ms.
cm_ctl: start cluster.
cm_ctl: start nodeid: 1
cm_ctl: start nodeid: 2
cm_ctl: start nodeid: 3
.................
cm_ctl: start cluster successfully.
-- 查看集群状态
[omm@opengauss-db1 ~]$ cm_ctl query -Cv
[ CMServerState ]
node instance state
---------------------------------
1    opengauss-db1 1    Primary
2    opengauss-db2 2    Standby
3    opengauss-db3 3    Standby
[ ClusterState ]
cluster_state : Normal
redistributing : No
balanced : Yes
current_az : AZ_ALL
[ DatanodeState ]
node instance state | node instance state | node instance state
---------------------------------------------------------------------------------------------------------------------------------------
1    opengauss-db1 6001 P Primary Normal | 2    opengauss-db2 6002 S Standby Normal | 3    opengauss-db3 6003 S Standby Normal
五、补充
5.1 初始化报expect命令未找到
-- 如未安装expect包导致初始化预检查调用expect命令时报错,报错信息如下:
[2022-11-09 11:13:42.081711][2196828][gs_sshexkey][DEBUG]:add ssh id_rsa output:/root/.ssh/./ssh-agent.sh: line 18: expect: command not found
[2022-11-09 11:13:42.082355][2196828][gs_sshexkey][DEBUG]:Error: Failed to register other ssh-agent, output is [Failed to ssh-add perform.Error: /root/.ssh/./ssh-agent.sh: line 18: expect: command not found] for 2 times
[2022-11-09 11:13:42.082573][2196828][gs_sshexkey][ERROR]:Error: Failed to register other ssh-agent,output is [Failed to ssh-add perform.Error: /root/.ssh/./ssh-agent.sh: line 18: expect: command not found]
[2022-11-09 11:13:42.314059][2196716][gs_preinstall][ERROR]:[GAUSS-51632] : Failed to do gs_sshexkey.Error: Please enter password for current user[root].
-- ssh-agent.sh脚本是openGauss自带脚本,内容为:
#!/bin/bash
#############################################################################
# Copyright (c): 2021-2025, Huawei Tech. Co., Ltd.
# FileName : ssh-agent
# Version : V1.0.0
# Date : 2020-01-13
#############################################################################
read -r secret
id_rsa_path="$1"
passwd=$secret
cmd="ssh-add ${id_rsa_path}"
func_remote_execute_cmd()
{
set timeout 5
echo "Access Method"
echo "ssh-agent command:$cmd"
expect << EOF
spawn $cmd
expect {
"Enter passphrase for *" {send $passwd\n}
}
expect {
"Bad passphrase*" {puts \"failure\";exit 2}
eof {puts \"success:eof\"\n }
}
catch wait result
puts \$result
exit [lindex \$result 3]
EOF
}
func_remote_execute_cmd
-- 解决办法:使用yum 执行 yum install -y expect后重新执行预执行命令
5.2 初始化报libpython.so文件未找到
# 在预检查过程中,遇到如下一些报错
报错一:
[GAUSS-51400] : Failed to execute the command: rm -rf '/tmp/step_preinstall_file.dat'. Result:{'opengauss-node1': 'Failure', 'opengauss-node2': 'Failure'}.
Error:
[FAILURE] opengauss-node1:
[FAILURE] opengauss-node2:
[GAUSS-52200] : Unable to import module: libpython3.6m.so.1.0: cannot open shared object file: No such file or directory.
-- 解决办法:
重新编译python,或者在其它已编译该python版本环境将libpython3.6m.so.1.0拷贝到当前服务器/usr/lib64 目录下
并在/etc/profile里执行 export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/python3/bin,并source /etc/profile生效
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 无需6万激活码!GitHub神秘组织3小时极速复刻Manus,手把手教你使用OpenManus搭建本
· C#/.NET/.NET Core优秀项目和框架2025年2月简报
· Manus爆火,是硬核还是营销?
· 终于写完轮子一部分:tcp代理 了,记录一下
· 【杭电多校比赛记录】2025“钉耙编程”中国大学生算法设计春季联赛(1)