Kubernetes Binary Deployment (this article may contain errors; written while learning k8s)

Environment for this article: virtual machines created with VMware

Operating system: Ubuntu 22.04.4

Remote access tool: Xshell 8

Host Environment Preparation

1. Hosts

Hostname         IP          Components                                                      Spec (physical host: 1 TB system disk, 2 TB data disk)
master141        10.0.0.141  kube-apiserver, kube-controller-manager, kube-scheduler, etcd   2 CPU, 4 GB RAM, 60 GB disk
master142        10.0.0.142  kube-apiserver, kube-controller-manager, kube-scheduler, etcd   2 CPU, 4 GB RAM, 60 GB disk
master143        10.0.0.143  kube-apiserver, kube-controller-manager, kube-scheduler, etcd   2 CPU, 4 GB RAM, 60 GB disk
worker144        10.0.0.144  kubelet, kube-proxy                                             2 CPU, 4 GB RAM, 60 GB disk
worker145        10.0.0.145  kubelet, kube-proxy                                             2 CPU, 4 GB RAM, 60 GB disk
apiserver-lb140  10.0.0.140  VIP of the apiserver load balancer                              2 CPU, 4 GB RAM, 60 GB disk

2. Install common packages on every node

apt update
apt -y install bind9-utils expect rsync jq psmisc net-tools lvm2 vim unzip rename

3. Run the following on master141

cat >> /etc/hosts <<'EOF'
10.0.0.140 apiserver-lb140
10.0.0.141 master141
10.0.0.142 master142
10.0.0.143 master143
10.0.0.144 worker144
10.0.0.145 worker145
EOF
cat > password_free_login.sh <<'EOF'
#!/bin/bash

ssh-keygen -t rsa -P "" -f /root/.ssh/id_rsa -q

export mypasswd=gshcmy

k8s_host_list=(master142 master143 worker144 worker145)

for i in ${k8s_host_list[@]};do
expect -c "
spawn ssh-copy-id -i /root/.ssh/id_rsa.pub root@$i
  expect {
    \"*yes/no*\" {send \"yes\r\"; exp_continue}
    \"*password*\" {send \"$mypasswd\r\"; exp_continue}
  }"
done
EOF
bash password_free_login.sh
cat > /usr/local/sbin/data_rsync.sh <<'EOF'
#!/bin/bash

if  [ $# -lt 1 ];then
   echo "Usage: $0 /path/to/file(absolute path) [mode: m|w]"
   exit
fi 

if [ ! -e $1 ];then
    echo "[ $1 ] dir or file not found!"
    exit
fi

fullpath=`dirname $1`

basename=`basename $1`

cd $fullpath

case $2 in
    WORKER_NODE|w)
      K8S_NODE=(master142 master143 worker144 worker145)
      ;;
    MASTER_NODE|m)
      K8S_NODE=(master142 master143)
      ;;
    *)
      K8S_NODE=(master142 master143 worker144 worker145)
     ;;
esac

for host in ${K8S_NODE[@]};do
  tput setaf 2
    echo ===== rsyncing ${host}: $basename =====
    tput setaf 7
    rsync -az $basename  `whoami`@${host}:$fullpath
    if [ $? -eq 0 ];then
      echo "Command executed successfully!"
    fi
done
EOF
chmod +x /usr/local/sbin/data_rsync.sh
data_rsync.sh /etc/hosts             # the password prompts are for the root password of each node
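
A quick sanity check that both the passwordless login and the /etc/hosts distribution worked; the loop below only assumes the host names defined above:

for h in master142 master143 worker144 worker145; do
  ssh -o BatchMode=yes root@$h 'hostname; grep -c master141 /etc/hosts'
done
# each host should print its own name followed by "1", with no password prompt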

4. Environment tuning on all nodes

root@master141:~# systemctl disable --now NetworkManager ufw
root@master142:~# systemctl disable --now NetworkManager ufw
root@master143:~# systemctl disable --now NetworkManager ufw
root@worker144:~# systemctl disable --now NetworkManager ufw
root@worker145:~# systemctl disable --now NetworkManager ufw
Tip: Xshell 8's compose bar lives under View → Compose → Compose Bar; the leftmost icon selects the target, here "All Xshell", so one command is broadcast to every session instead of being typed node by node (the original screenshot is omitted).
swapoff -a && sysctl -w vm.swappiness=0
sed -ri '/^[^#]*swap/s@^@#@' /etc/fstab
ln -svf /usr/share/zoneinfo/Asia/Shanghai /etc/localtime
cat >> /etc/security/limits.conf <<'EOF'
* soft nofile 655360
* hard nofile 655360
* soft nproc 655350
* hard nproc 655350
* soft memlock unlimited
* hard memlock unlimited
EOF

Run on every node:
sed -i 's@#UseDNS yes@UseDNS no@g' /etc/ssh/sshd_config
sed -i 's@^GSSAPIAuthentication yes@GSSAPIAuthentication no@g' /etc/ssh/sshd_config
cat > /etc/sysctl.d/k8s.conf <<'EOF'
net.ipv4.ip_forward = 1
net.bridge.bridge-nf-call-iptables = 1
net.bridge.bridge-nf-call-ip6tables = 1
net.ipv6.conf.all.disable_ipv6 = 1
fs.may_detach_mounts = 1
vm.overcommit_memory=1
vm.panic_on_oom=0
fs.inotify.max_user_watches=89100
fs.file-max=52706963
fs.nr_open=52706963
net.netfilter.nf_conntrack_max=2310720
net.ipv4.tcp_keepalive_time = 600
net.ipv4.tcp_keepalive_probes = 3
net.ipv4.tcp_keepalive_intvl = 15
net.ipv4.tcp_max_tw_buckets = 36000
net.ipv4.tcp_tw_reuse = 1
net.ipv4.tcp_max_orphans = 327680
net.ipv4.tcp_orphan_retries = 3
net.ipv4.tcp_syncookies = 1
net.ipv4.tcp_max_syn_backlog = 16384
net.ipv4.tcp_timestamps = 0
net.core.somaxconn = 16384
EOF

On all nodes:
sysctl --system
On all nodes:
cat <<EOF >>  ~/.bashrc
PS1='[\[\e[35;1m\]\u@\[\e[0m\]\[\e[32;1m\]\H\[\e[0m\]\[\e[34;1m\] \W\[\e[0m\]]# '
EOF

The prompt colors are purple (user), green (host), and blue (working directory).
source ~/.bashrc

5. Install ipvsadm on all nodes so kube-proxy can do IPVS load balancing

apt -y install ipvsadm ipset sysstat conntrack libseccomp2
cat > /etc/modules-load.d/ipvs.conf << 'EOF'
ip_vs
ip_vs_lc
ip_vs_wlc
ip_vs_rr
ip_vs_wrr
ip_vs_lblc
ip_vs_lblcr
ip_vs_dh
ip_vs_sh
ip_vs_fo
ip_vs_nq
ip_vs_sed
ip_vs_ftp
nf_conntrack
ip_tables
ip_set
xt_set
ipt_set
ipt_rpfilter
ipt_REJECT
ipip
EOF
vim /etc/default/grub
On all nodes, append net.ifnames=0 biosdevname=0 to the end of the GRUB_CMDLINE_LINUX line (the original screenshots are omitted here):
GRUB_CMDLINE_LINUX="... net.ifnames=0 biosdevname=0"
grub-mkconfig -o /boot/grub/grub.cfg
vim /etc/netplan/00-installer-config.yaml       # content below; needed on all of 141-145, adjusting the address per node
network:
  ethernets:
    eth0:
      dhcp4: false
      addresses:
        - 10.0.0.141/24
      routes:
        - to: default
          via: 10.0.0.2
      nameservers:
        addresses:
          # 114 DNS
          - 114.114.114.114
          - 114.114.115.115
          # Alibaba Cloud DNS
          - 223.5.5.5
          - 223.6.6.6
          # Tencent Cloud DNS
          - 119.29.29.29
          - 119.28.28.28
          # Baidu DNS
          - 180.76.76.76
          # Google DNS
          - 8.8.8.8
          - 8.8.4.4
  version: 2
reboot
After the reboot, verify the modules, kernel, and NIC name:
lsmod | grep --color=auto -e ip_vs -e nf_conntrack
uname -r
ifconfig
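
To spot-check the tuning on every node at once, a hedged loop from master141 (run the same two commands locally on master141 as well):

for h in master142 master143 worker144 worker145; do
  echo "===== $h ====="
  ssh root@$h 'swapon --show; sysctl -n net.ipv4.ip_forward net.bridge.bridge-nf-call-iptables'
done
# swapon --show should print nothing, and both sysctl values should be 1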

Install containerd (all nodes)

1. Install system tools

apt-get -y install apt-transport-https ca-certificates curl software-properties-common

2. Install the repository GPG key

curl -fsSL https://mirrors.aliyun.com/docker-ce/linux/ubuntu/gpg | apt-key add -

3. Add the repository

add-apt-repository "deb [arch=amd64] https://mirrors.aliyun.com/docker-ce/linux/ubuntu $(lsb_release -cs) stable"

4. Update the package index

apt-get update

5. Install containerd

apt-get -y install containerd.io

6. Load the kernel modules containerd needs

modprobe -- overlay
modprobe -- br_netfilter
cat > /etc/modules-load.d/containerd.conf <<EOF
overlay
br_netfilter
EOF
Run on all nodes.

7. Modify containerd's configuration file

containerd config default | tee /etc/containerd/config.toml
sed -ri 's#(SystemdCgroup = )false#\1true#' /etc/containerd/config.toml
grep SystemdCgroup /etc/containerd/config.toml

Change the pause (sandbox) base image

sed -i 's#registry.k8s.io/pause:3.6#registry.cn-hangzhou.aliyuncs.com/google_containers/pause:3.7#' /etc/containerd/config.toml
or, depending on the pause version in your generated config.toml:
sed -i 's#registry.k8s.io/pause:3.10.1#registry.cn-hangzhou.aliyuncs.com/google_containers/pause:3.7#' /etc/containerd/config.toml

sed -i 's#sandbox =#sandbox_image =#' /etc/containerd/config.toml
grep sandbox_image /etc/containerd/config.toml

Start containerd on all nodes

systemctl daemon-reload
systemctl enable --now containerd
systemctl status containerd

cat > /etc/crictl.yaml <<EOF
runtime-endpoint: unix:///run/containerd/containerd.sock
image-endpoint: unix:///run/containerd/containerd.sock
timeout: 10
debug: false
EOF
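
crictl reads the endpoint configured above, so a couple of standard crictl subcommands make a quick sanity check of the CRI wiring (assuming the crictl binary from the cri-tools project is installed):

crictl info | head -n 5     # runtime status, printed as JSON
crictl images               # images in the k8s.io namespace
crictl ps -a                # CRI containers (empty until kubelet schedules pods)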

Check the containerd version

ctr version

containerd namespace, image/container, and task management

List the current namespaces

ctr ns ls

Namespaces

Create a namespace

ctr ns c gshcmy-k8s
ctr ns ls

Delete a namespace (the namespace must be empty, otherwise it cannot be deleted)

ctr ns rm gshcmy-k8s
ctr ns ls

Image management

Pull an image into a namespace (the image below is just a practice image and may not exist; substitute your own)

ctr ns c gshcmy-k8s
ctr ns ls
ctr image pull registry.cn-hangzhou.aliyuncs.com/gshcmy-k8s/apps:v1
ctr i ls
ctr -n default i ls
ctr  -n gshcmy-k8s i ls
ctr  -n gshcmy-k8s image pull registry.cn-hangzhou.aliyuncs.com/gshcmy-k8s/apps:v2
ctr  -n gshcmy-k8s i ls

Delete an image

ctr -n default i ls
ctr i rm registry.cn-hangzhou.aliyuncs.com/gshcmy-k8s/apps:v1

Container management

Run a container

ctr -n gshcmy-k8s run registry.cn-hangzhou.aliyuncs.com/gshcmy-k8s/apps:v2 haha

List containers

[root@master141 ~]# ctr -n gshcmy-k8s c ls
CONTAINER    IMAGE                                                        RUNTIME                  
haha         registry.cn-hangzhou.aliyuncs.com/gshcmy-k8s/apps:v2    io.containerd.runc.v2    

List running tasks and their PIDs

[root@master141 ~]# ctr -n gshcmy-k8s t ls
TASK    PID      STATUS    
haha    19041    RUNNING
[root@master141 ~]# 

Exec into a running container

[root@master141 ~]# ctr -n gshcmy-k8s t exec -t --exec-id 2024 haha sh
/ # ifconfig
lo        Link encap:Local Loopback  
          inet addr:127.0.0.1  Mask:255.0.0.0
          inet6 addr: ::1/128 Scope:Host
          UP LOOPBACK RUNNING  MTU:65536  Metric:1
          RX packets:0 errors:0 dropped:0 overruns:0 frame:0
          TX packets:0 errors:0 dropped:0 overruns:0 carrier:0
          collisions:0 txqueuelen:1000 
          RX bytes:0 (0.0 B)  TX bytes:0 (0.0 B)

/ # 

Kill a running container

[root@master141 ~]# ctr -n gshcmy-k8s t kill haha
[root@master141 ~]# ctr -n gshcmy-k8s t ls
TASK    PID    STATUS    

Delete a container

[root@master141 ~]# ctr -n gshcmy-k8s c ls
CONTAINER    IMAGE                                                        RUNTIME                  
haha         registry.cn-hangzhou.aliyuncs.com/gshcmy-k8s/apps:v2    io.containerd.runc.v2   

[root@master141 ~]# ctr -n gshcmy-k8s c rm haha
[root@master141 ~]# ctr -n gshcmy-k8s c ls
CONTAINER    IMAGE    RUNTIME    

Install etcd (downloading from GitHub may require a proxy)

wget https://github.com/etcd-io/etcd/releases/download/v3.5.14/etcd-v3.5.14-linux-amd64.tar.gz

Extract the etcd binaries

tar -xf etcd-v3.5.14-linux-amd64.tar.gz --strip-components=1 -C /usr/local/bin etcd-v3.5.14-linux-amd64/etcd{,ctl}
ll /usr/local/bin/
[root@master141 ~]# etcdctl version     # check the version
etcdctl version: 3.5.14
API version: 3.5

Distribute the binaries to the other master nodes

[root@master141 ~]# data_rsync.sh /usr/local/bin/etcd m
===== rsyncing master142: etcd =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: etcd =====
root@master143's password: 
Command executed successfully!
[root@master141 ~]# data_rsync.sh /usr/local/bin/etcdctl m
===== rsyncing master142: etcdctl =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: etcdctl =====
root@master143's password: 
Command executed successfully!
[root@master141 ~]# 

Install the Kubernetes binaries

wget https://dl.k8s.io/v1.30.2/kubernetes-server-linux-amd64.tar.gz

Extract the Kubernetes binaries:

tar -xf kubernetes-server-linux-amd64.tar.gz  --strip-components=3 -C /usr/local/bin kubernetes/server/bin/kube{let,ctl,-apiserver,-controller-manager,-scheduler,-proxy}

Check the version:
[root@master141 ~]# kubelet --version 
Kubernetes v1.30.2
[root@master141 ~]# 

Distribute the binaries:
[root@master141 ~]# data_rsync.sh /usr/local/bin/kube-apiserver m
[root@master141 ~]# data_rsync.sh /usr/local/bin/kube-scheduler m
[root@master141 ~]# data_rsync.sh /usr/local/bin/kube-controller-manager m
[root@master141 ~]# data_rsync.sh /usr/local/bin/kubectl m
[root@master141 ~]# data_rsync.sh /usr/local/bin/kubelet w
[root@master141 ~]# data_rsync.sh /usr/local/bin/kube-proxy w
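
A hedged way to confirm each node received the right binaries, reusing the SSH trust set up earlier:

for h in master142 master143; do ssh root@$h '/usr/local/bin/kube-apiserver --version'; done
for h in worker144 worker145; do ssh root@$h '/usr/local/bin/kubelet --version'; done
# every line should read: Kubernetes v1.30.2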

Generate the etcd certificates

wget https://github.com/cloudflare/cfssl/releases/download/v1.6.5/cfssl-certinfo_1.6.5_linux_amd64
wget https://github.com/cloudflare/cfssl/releases/download/v1.6.5/cfssljson_1.6.5_linux_amd64
wget https://github.com/cloudflare/cfssl/releases/download/v1.6.5/cfssl_1.6.5_linux_amd64
Take a VM snapshot after downloading.

Strip the version suffix from the cfssl file names

[root@master141 ~]# ll cfssl*
-rw-r--r-- 1 root root 11890840 Jun 15  2024 cfssl_1.6.5_linux_amd64
-rw-r--r-- 1 root root  8413336 Jun 15  2024 cfssl-certinfo_1.6.5_linux_amd64
-rw-r--r-- 1 root root  6205592 Jun 15  2024 cfssljson_1.6.5_linux_amd64
[root@master141 ~]# rename -v "s/_1.6.5_linux_amd64//g" cfssl*
cfssl_1.6.5_linux_amd64 renamed as cfssl
cfssl-certinfo_1.6.5_linux_amd64 renamed as cfssl-certinfo
cfssljson_1.6.5_linux_amd64 renamed as cfssljson
[root@master141 ~]#
[root@master141 ~]# ll cfssl*
-rw-r--r-- 1 root root 11890840 Jun 15  2024 cfssl
-rw-r--r-- 1 root root  8413336 Jun 15  2024 cfssl-certinfo
-rw-r--r-- 1 root root  6205592 Jun 15  2024 cfssljson

Move the cfssl binaries into the PATH and make them executable

[root@master141 ~]# mv cfssl* /usr/local/bin/
[root@master141 ~]# chmod +x /usr/local/bin/cfssl*
[root@master141 ~]# ll /usr/local/bin/cfssl*
-rwxr-xr-x 1 root root 11890840 Jun 15  2024 /usr/local/bin/cfssl*
-rwxr-xr-x 1 root root  8413336 Jun 15  2024 /usr/local/bin/cfssl-certinfo*
-rwxr-xr-x 1 root root  6205592 Jun 15  2024 /usr/local/bin/cfssljson*

Create the etcd certificate directories on master141

[root@master141 ~]# mkdir -pv /gshcmy/certs/{etcd,pki}/ && cd /gshcmy/certs/pki/
[root@master141 pki]# cat > etcd-ca-csr.json <<EOF
{
  "CN": "etcd",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "etcd",
      "OU": "Etcd Security"
    }
  ],
  "ca": {
    "expiry": "876000h"
  }
}
EOF

Generate the etcd CA certificate and its key

[root@master141 pki]# cfssl gencert -initca etcd-ca-csr.json | cfssljson -bare /gshcmy/certs/etcd/etcd-ca
2025/12/23 16:58:16 [INFO] generating a new CA key and certificate from CSR
2025/12/23 16:58:16 [INFO] generate received request
2025/12/23 16:58:16 [INFO] received CSR
2025/12/23 16:58:16 [INFO] generating key: rsa-2048
2025/12/23 16:58:16 [INFO] encoded CSR
2025/12/23 16:58:16 [INFO] signed certificate with serial number 670358402125359505823061965820939276734710307322
[root@master141 pki]# pwd
/gshcmy/certs/pki
[root@master141 pki]# ll /gshcmy/certs/etcd/
total 20
drwxr-xr-x 2 root root 4096 Dec 23 16:58 ./
drwxr-xr-x 4 root root 4096 Dec 23 16:57 ../
-rw-r--r-- 1 root root 1050 Dec 23 16:58 etcd-ca.csr
-rw------- 1 root root 1675 Dec 23 16:58 etcd-ca-key.pem
-rw-r--r-- 1 root root 1318 Dec 23 16:58 etcd-ca.pem
[root@master141 pki]#

Issue the etcd server certificate from the self-managed CA on master141

[root@master141 pki]# cat > ca-config.json <<EOF
{
  "signing": {
    "default": {
      "expiry": "876000h"
    },
    "profiles": {
      "kubernetes": {
        "usages": [
            "signing",
            "key encipherment",
            "server auth",
            "client auth"
        ],
        "expiry": "876000h"
      }
    }
  }
}
EOF


[root@master141 pki]# cat > etcd-csr.json <<EOF
{
  "CN": "etcd",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "etcd",
      "OU": "Etcd Security"
    }
  ]
}
EOF


[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/etcd/etcd-ca.pem \
  -ca-key=/gshcmy/certs/etcd/etcd-ca-key.pem \
  -config=ca-config.json \
  --hostname=127.0.0.1,master141,master142,master143,10.0.0.141,10.0.0.142,10.0.0.143 \
  --profile=kubernetes \
  etcd-csr.json  | cfssljson -bare /gshcmy/certs/etcd/etcd-server

[root@master141 pki]# ll /gshcmy/certs/etcd/etcd-server*
-rw-r--r-- 1 root root 1119 Dec 23 17:07 /gshcmy/certs/etcd/etcd-server.csr
-rw------- 1 root root 1675 Dec 23 17:07 /gshcmy/certs/etcd/etcd-server-key.pem
-rw-r--r-- 1 root root 1452 Dec 23 17:07 /gshcmy/certs/etcd/etcd-server.pem
[root@master141 pki]# 

Copy the etcd certificates from master141 to the other two master nodes

[root@master141 pki]# MasterNodes='master142 master143'
[root@master141 pki]# for NODE in $MasterNodes; do ssh $NODE "mkdir -pv /gshcmy/certs/etcd/"; done
root@master142's password: 
mkdir: created directory '/gshcmy'
mkdir: created directory '/gshcmy/certs'
mkdir: created directory '/gshcmy/certs/etcd/'
root@master143's password: 
mkdir: created directory '/gshcmy'
mkdir: created directory '/gshcmy/certs'
mkdir: created directory '/gshcmy/certs/etcd/'

[root@master141 pki]# data_rsync.sh /gshcmy/certs/etcd/etcd-ca-key.pem m
===== rsyncing master142: etcd-ca-key.pem =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: etcd-ca-key.pem =====
root@master143's password: 
Command executed successfully!
[root@master141 pki]# data_rsync.sh /gshcmy/certs/etcd/etcd-ca.pem m
===== rsyncing master142: etcd-ca.pem =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: etcd-ca.pem =====
root@master143's password: 
Command executed successfully!
[root@master141 pki]# data_rsync.sh /gshcmy/certs/etcd/etcd-server-key.pem m
===== rsyncing master142: etcd-server-key.pem =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: etcd-server-key.pem =====
root@master143's password: 
Command executed successfully!
[root@master141 pki]# data_rsync.sh /gshcmy/certs/etcd/etcd-server.pem m
===== rsyncing master142: etcd-server.pem =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: etcd-server.pem =====
root@master143's password: 
Command executed successfully!

Start the etcd cluster

Create the etcd configuration file on each node

[root@master141 ~]# mkdir -pv /gshcmy/softwares/etcd
[root@master141 ~]# cat > /gshcmy/softwares/etcd/etcd.config.yml <<'EOF'
name: 'master141'
data-dir: /var/lib/etcd
wal-dir: /var/lib/etcd/wal
snapshot-count: 5000
heartbeat-interval: 100
election-timeout: 1000
quota-backend-bytes: 0
listen-peer-urls: 'https://10.0.0.141:2380'
listen-client-urls: 'https://10.0.0.141:2379,http://127.0.0.1:2379'
max-snapshots: 3
max-wals: 5
cors:
initial-advertise-peer-urls: 'https://10.0.0.141:2380'
advertise-client-urls: 'https://10.0.0.141:2379'
discovery:
discovery-fallback: 'proxy'
discovery-proxy:
discovery-srv:
initial-cluster: 'master141=https://10.0.0.141:2380,master142=https://10.0.0.142:2380,master143=https://10.0.0.143:2380'
initial-cluster-token: 'etcd-k8s-cluster'
initial-cluster-state: 'new'
strict-reconfig-check: false
enable-v2: true
enable-pprof: true
proxy: 'off'
proxy-failure-wait: 5000
proxy-refresh-interval: 30000
proxy-dial-timeout: 1000
proxy-write-timeout: 5000
proxy-read-timeout: 0
client-transport-security:
  cert-file: '/gshcmy/certs/etcd/etcd-server.pem'
  key-file: '/gshcmy/certs/etcd/etcd-server-key.pem'
  client-cert-auth: true
  trusted-ca-file: '/gshcmy/certs/etcd/etcd-ca.pem'
  auto-tls: true
peer-transport-security:
  cert-file: '/gshcmy/certs/etcd/etcd-server.pem'
  key-file: '/gshcmy/certs/etcd/etcd-server-key.pem'
  peer-client-cert-auth: true
  trusted-ca-file: '/gshcmy/certs/etcd/etcd-ca.pem'
  auto-tls: true
debug: false
log-package-levels:
log-outputs: [default]
force-new-cluster: false
EOF
[root@master142 ~]# mkdir -pv /gshcmy/softwares/etcd
[root@master142 ~]# cat > /gshcmy/softwares/etcd/etcd.config.yml << 'EOF'
name: 'master142'
data-dir: /var/lib/etcd
wal-dir: /var/lib/etcd/wal
snapshot-count: 5000
heartbeat-interval: 100
election-timeout: 1000
quota-backend-bytes: 0
listen-peer-urls: 'https://10.0.0.142:2380'
listen-client-urls: 'https://10.0.0.142:2379,http://127.0.0.1:2379'
max-snapshots: 3
max-wals: 5
cors:
initial-advertise-peer-urls: 'https://10.0.0.142:2380'
advertise-client-urls: 'https://10.0.0.142:2379'
discovery:
discovery-fallback: 'proxy'
discovery-proxy:
discovery-srv:
initial-cluster: 'master141=https://10.0.0.141:2380,master142=https://10.0.0.142:2380,master143=https://10.0.0.143:2380'
initial-cluster-token: 'etcd-k8s-cluster'
initial-cluster-state: 'new'
strict-reconfig-check: false
enable-v2: true
enable-pprof: true
proxy: 'off'
proxy-failure-wait: 5000
proxy-refresh-interval: 30000
proxy-dial-timeout: 1000
proxy-write-timeout: 5000
proxy-read-timeout: 0
client-transport-security:
  cert-file: '/gshcmy/certs/etcd/etcd-server.pem'
  key-file: '/gshcmy/certs/etcd/etcd-server-key.pem'
  client-cert-auth: true
  trusted-ca-file: '/gshcmy/certs/etcd/etcd-ca.pem'
  auto-tls: true
peer-transport-security:
  cert-file: '/gshcmy/certs/etcd/etcd-server.pem'
  key-file: '/gshcmy/certs/etcd/etcd-server-key.pem'
  peer-client-cert-auth: true
  trusted-ca-file: '/gshcmy/certs/etcd/etcd-ca.pem'
  auto-tls: true
debug: false
log-package-levels:
log-outputs: [default]
force-new-cluster: false
EOF
[root@master143 ~]# mkdir -pv /gshcmy/softwares/etcd
[root@master143 ~]# cat > /gshcmy/softwares/etcd/etcd.config.yml << 'EOF'
name: 'master143'
data-dir: /var/lib/etcd
wal-dir: /var/lib/etcd/wal
snapshot-count: 5000
heartbeat-interval: 100
election-timeout: 1000
quota-backend-bytes: 0
listen-peer-urls: 'https://10.0.0.143:2380'
listen-client-urls: 'https://10.0.0.143:2379,http://127.0.0.1:2379'
max-snapshots: 3
max-wals: 5
cors:
initial-advertise-peer-urls: 'https://10.0.0.143:2380'
advertise-client-urls: 'https://10.0.0.143:2379'
discovery:
discovery-fallback: 'proxy'
discovery-proxy:
discovery-srv:
initial-cluster: 'master141=https://10.0.0.141:2380,master142=https://10.0.0.142:2380,master143=https://10.0.0.143:2380'
initial-cluster-token: 'etcd-k8s-cluster'
initial-cluster-state: 'new'
strict-reconfig-check: false
enable-v2: true
enable-pprof: true
proxy: 'off'
proxy-failure-wait: 5000
proxy-refresh-interval: 30000
proxy-dial-timeout: 1000
proxy-write-timeout: 5000
proxy-read-timeout: 0
client-transport-security:
  cert-file: '/gshcmy/certs/etcd/etcd-server.pem'
  key-file: '/gshcmy/certs/etcd/etcd-server-key.pem'
  client-cert-auth: true
  trusted-ca-file: '/gshcmy/certs/etcd/etcd-ca.pem'
  auto-tls: true
peer-transport-security:
  cert-file: '/gshcmy/certs/etcd/etcd-server.pem'
  key-file: '/gshcmy/certs/etcd/etcd-server-key.pem'
  peer-client-cert-auth: true
  trusted-ca-file: '/gshcmy/certs/etcd/etcd-ca.pem'
  auto-tls: true
debug: false
log-package-levels:
log-outputs: [default]
force-new-cluster: false
EOF

Write the etcd systemd unit on master[141-143] (all three nodes need it)

cat > /usr/lib/systemd/system/etcd.service <<'EOF'
[Unit]
Description=Gsh cmy's Etcd Service
Documentation=https://coreos.com/etcd/docs/latest/
After=network.target

[Service]
Type=notify
ExecStart=/usr/local/bin/etcd --config-file=/gshcmy/softwares/etcd/etcd.config.yml
Restart=on-failure
RestartSec=10
LimitNOFILE=65536

[Install]
WantedBy=multi-user.target
Alias=etcd3.service
EOF

Start etcd

systemctl daemon-reload && systemctl enable --now etcd
systemctl status etcd

Check the cluster status:
etcdctl --endpoints="10.0.0.141:2379,10.0.0.142:2379,10.0.0.143:2379" --cacert=/gshcmy/certs/etcd/etcd-ca.pem --cert=/gshcmy/certs/etcd/etcd-server.pem --key=/gshcmy/certs/etcd/etcd-server-key.pem  endpoint status --write-out=table

You can stop one node to verify that high availability works: systemctl stop etcd
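
Beyond endpoint status, etcdctl can also report per-member health and the member list; with one member stopped, the other two endpoints should stay healthy and the status table shows a new leader:

CERTS="--cacert=/gshcmy/certs/etcd/etcd-ca.pem --cert=/gshcmy/certs/etcd/etcd-server.pem --key=/gshcmy/certs/etcd/etcd-server-key.pem"
etcdctl --endpoints="10.0.0.141:2379,10.0.0.142:2379,10.0.0.143:2379" $CERTS endpoint health
etcdctl --endpoints="10.0.0.141:2379,10.0.0.142:2379,10.0.0.143:2379" $CERTS member list --write-out=table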

Generate the Kubernetes component certificates

Create the Kubernetes certificate directory on all nodes (masters and workers)

mkdir -pv /gshcmy/certs/kubernetes/

Generate the self-managed Kubernetes CA on master141

1. Create the CSR file: a certificate signing request configuring the names, organization, and unit
[root@master141 pki]# pwd
/gshcmy/certs/pki

[root@master141 pki]# cat > k8s-ca-csr.json  <<EOF
{
"CN": "kubernetes",
"key": {
  "algo": "rsa",
  "size": 2048
},
"names": [
  {
    "C": "CN",
    "ST": "Beijing",
    "L": "Beijing",
    "O": "Kubernetes",
    "OU": "Kubernetes-manual"
  }
],
"ca": {
  "expiry": "876000h"
}
}
EOF

[root@master141 pki]# cfssl gencert -initca k8s-ca-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/k8s-ca
2025/12/23 21:10:47 [INFO] generating a new CA key and certificate from CSR
2025/12/23 21:10:47 [INFO] generate received request
2025/12/23 21:10:47 [INFO] received CSR
2025/12/23 21:10:47 [INFO] generating key: rsa-2048
2025/12/23 21:10:47 [INFO] encoded CSR
2025/12/23 21:10:47 [INFO] signed certificate with serial number 172725731318857238528414959316294645059717357847

[root@master141 pki]# ll /gshcmy/certs/kubernetes/
total 20
drwxr-xr-x 2 root root 4096 Dec 23 21:10 ./
drwxr-xr-x 5 root root 4096 Dec 23 20:56 ../
-rw-r--r-- 1 root root 1070 Dec 23 21:10 k8s-ca.csr
-rw------- 1 root root 1679 Dec 23 21:10 k8s-ca-key.pem
-rw-r--r-- 1 root root 1363 Dec 23 21:10 k8s-ca.pem

Issue the apiserver certificates from the self-managed CA on master141

The Kubernetes certificates are issued with a 100-year validity (876000h):
[root@master141 pki]# cat > k8s-ca-config.json <<EOF
{
  "signing": {
    "default": {
      "expiry": "876000h"
    },
    "profiles": {
      "kubernetes": {
        "usages": [
            "signing",
            "key encipherment",
            "server auth",
            "client auth"
        ],
        "expiry": "876000h"
      }
    }
  }
}
EOF


Create the apiserver CSR file: a certificate signing request configuring the names, organization, and unit
[root@master141 pki]# cat > apiserver-csr.json <<EOF
{
  "CN": "kube-apiserver",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "Kubernetes",
      "OU": "Kubernetes-manual"
    }
  ]
}
EOF


Sign the apiserver certificate with the self-managed CA
[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/kubernetes/k8s-ca.pem \
  -ca-key=/gshcmy/certs/kubernetes/k8s-ca-key.pem \
  -config=k8s-ca-config.json \
  --hostname=10.200.0.1,10.0.0.140,kubernetes,kubernetes.default,kubernetes.default.svc,kubernetes.default.svc.gshcmy,kubernetes.default.svc.gshcmy.com,master141,master142,master143,worker144,worker145,10.0.0.141,10.0.0.142,10.0.0.143,10.0.0.144,10.0.0.145 \
  --profile=kubernetes \
   apiserver-csr.json  | cfssljson -bare /gshcmy/certs/kubernetes/apiserver

[root@master141 pki]# ll /gshcmy/certs/kubernetes/apiserver*
-rw-r--r-- 1 root root 1301 Dec 23 21:30 /gshcmy/certs/kubernetes/apiserver.csr
-rw------- 1 root root 1675 Dec 23 21:30 /gshcmy/certs/kubernetes/apiserver-key.pem
-rw-r--r-- 1 root root 1696 Dec 23 21:30 /gshcmy/certs/kubernetes/apiserver.pem

"10.200.0.1"为svc网段的第一个地址,需要根据自己的场景稍作修改。
	"10.0.0.240"是负载均衡器的VIP地址。
	"kubernetes,...,kubernetes.default.svc.gshcmy.com"对应的是apiServer解析的A记录。
	"10.0.0.241,...,10.0.0.245"对应的是K8S集群的地址。 

Generate the aggregation (front-proxy) certificates used by third-party components to talk to the apiserver

Create the CSR for the front-proxy self-managed CA
[root@master141 pki]# cat > front-proxy-ca-csr.json <<EOF
{
  "CN": "kubernetes",
  "key": {
     "algo": "rsa",
     "size": 2048
  }
}
EOF


Generate the front-proxy CA certificate
[root@master141 pki]# cfssl gencert -initca front-proxy-ca-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/front-proxy-ca
[root@master141 pki]# ll /gshcmy/certs/kubernetes/front-proxy-ca*
-rw-r--r-- 1 root root  891 Dec 23 21:37 /gshcmy/certs/kubernetes/front-proxy-ca.csr
-rw------- 1 root root 1675 Dec 23 21:37 /gshcmy/certs/kubernetes/front-proxy-ca-key.pem
-rw-r--r-- 1 root root 1094 Dec 23 21:37 /gshcmy/certs/kubernetes/front-proxy-ca.pem

Create the CSR for the front-proxy client certificate
[root@master141 pki]# cat > front-proxy-client-csr.json <<EOF
{
  "CN": "front-proxy-client",
  "key": {
     "algo": "rsa",
     "size": 2048
  }
}
EOF

Sign the front-proxy client certificate with the front-proxy CA
[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/kubernetes/front-proxy-ca.pem \
  -ca-key=/gshcmy/certs/kubernetes/front-proxy-ca-key.pem \
  -config=k8s-ca-config.json \
  -profile=kubernetes \
  front-proxy-client-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/front-proxy-client

[root@master141 pki]# ll /gshcmy/certs/kubernetes/front-proxy-client*
-rw-r--r-- 1 root root  903 Dec 23 22:08 /gshcmy/certs/kubernetes/front-proxy-client.csr
-rw------- 1 root root 1679 Dec 23 22:08 /gshcmy/certs/kubernetes/front-proxy-client-key.pem
-rw-r--r-- 1 root root 1188 Dec 23 22:08 /gshcmy/certs/kubernetes/front-proxy-client.pem

Generate the controller-manager certificate and kubeconfig file

Create the controller-manager CSR
[root@master141 pki]# cat > controller-manager-csr.json <<EOF
{
  "CN": "system:kube-controller-manager",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "system:kube-controller-manager",
      "OU": "Kubernetes-manual"
    }
  ]
}
EOF

Sign the controller-manager certificate
[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/kubernetes/k8s-ca.pem \
  -ca-key=/gshcmy/certs/kubernetes/k8s-ca-key.pem \
  -config=k8s-ca-config.json \
  -profile=kubernetes \
  controller-manager-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/controller-manager

[root@master141 pki]# ll /gshcmy/certs/kubernetes/controller-manager*
-rw-r--r-- 1 root root 1082 Dec 23 22:20 /gshcmy/certs/kubernetes/controller-manager.csr
-rw------- 1 root root 1675 Dec 23 22:20 /gshcmy/certs/kubernetes/controller-manager-key.pem
-rw-r--r-- 1 root root 1501 Dec 23 22:20 /gshcmy/certs/kubernetes/controller-manager.pem

Create a kubeconfig directory
[root@master141 pki]# mkdir -pv /gshcmy/certs/kubeconfig

Set the cluster entry
[root@master141 pki]# kubectl config set-cluster gshcmy-k8s \
  --certificate-authority=/gshcmy/certs/kubernetes/k8s-ca.pem \
  --embed-certs=true \
  --server=https://10.0.0.140:8443 \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-controller-manager.kubeconfig

Set the user entry
[root@master141 pki]# kubectl config set-credentials system:kube-controller-manager \
  --client-certificate=/gshcmy/certs/kubernetes/controller-manager.pem \
  --client-key=/gshcmy/certs/kubernetes/controller-manager-key.pem \
  --embed-certs=true \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-controller-manager.kubeconfig

Set the context
[root@master141 pki]# kubectl config set-context system:kube-controller-manager@kubernetes \
  --cluster=gshcmy-k8s \
  --user=system:kube-controller-manager \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-controller-manager.kubeconfig

Use the context as the default
[root@master141 pki]# kubectl config use-context system:kube-controller-manager@kubernetes \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-controller-manager.kubeconfig
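
To confirm the kubeconfig was assembled correctly, kubectl can print a redacted view; the server field should read https://10.0.0.140:8443 and the embedded certificates show up as DATA+OMITTED:

kubectl config view --kubeconfig=/gshcmy/certs/kubeconfig/kube-controller-manager.kubeconfig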

Generate the scheduler certificate and kubeconfig file

Create the scheduler CSR
[root@master141 pki]# cat > scheduler-csr.json <<EOF
{
  "CN": "system:kube-scheduler",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "system:kube-scheduler",
      "OU": "Kubernetes-manual"
    }
  ]
}
EOF

Sign the scheduler certificate
[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/kubernetes/k8s-ca.pem \
  -ca-key=/gshcmy/certs/kubernetes/k8s-ca-key.pem \
  -config=k8s-ca-config.json \
  -profile=kubernetes \
  scheduler-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/scheduler

[root@master141 pki]# ll /gshcmy/certs/kubernetes/scheduler*
-rw-r--r-- 1 root root 1058 Dec 23 22:33 /gshcmy/certs/kubernetes/scheduler.csr
-rw------- 1 root root 1675 Dec 23 22:33 /gshcmy/certs/kubernetes/scheduler-key.pem
-rw-r--r-- 1 root root 1476 Dec 23 22:33 /gshcmy/certs/kubernetes/scheduler.pem

Set the cluster entry
[root@master141 pki]# kubectl config set-cluster gshcmy-k8s \
  --certificate-authority=/gshcmy/certs/kubernetes/k8s-ca.pem \
  --embed-certs=true \
  --server=https://10.0.0.140:8443 \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-scheduler.kubeconfig

Set the user entry
[root@master141 pki]# kubectl config set-credentials system:kube-scheduler \
  --client-certificate=/gshcmy/certs/kubernetes/scheduler.pem \
  --client-key=/gshcmy/certs/kubernetes/scheduler-key.pem \
  --embed-certs=true \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-scheduler.kubeconfig

Set the context
[root@master141 pki]# kubectl config set-context system:kube-scheduler@kubernetes \
  --cluster=gshcmy-k8s \
  --user=system:kube-scheduler \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-scheduler.kubeconfig

Use the context as the default
[root@master141 pki]# kubectl config use-context system:kube-scheduler@kubernetes \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-scheduler.kubeconfig

Generate the cluster administrator certificate and kubeconfig file

Create the administrator CSR
[root@master141 pki]# cat > admin-csr.json <<EOF
{
  "CN": "admin",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "system:masters",
      "OU": "Kubernetes-manual"
    }
  ]
}
EOF

Sign the cluster administrator certificate
[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/kubernetes/k8s-ca.pem \
  -ca-key=/gshcmy/certs/kubernetes/k8s-ca-key.pem \
  -config=k8s-ca-config.json \
  -profile=kubernetes \
  admin-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/admin

[root@master141 pki]# ll /gshcmy/certs/kubernetes/admin*
-rw-r--r-- 1 root root 1025 Dec 23 22:47 /gshcmy/certs/kubernetes/admin.csr
-rw------- 1 root root 1675 Dec 23 22:47 /gshcmy/certs/kubernetes/admin-key.pem
-rw-r--r-- 1 root root 1444 Dec 23 22:47 /gshcmy/certs/kubernetes/admin.pem

Set the cluster entry
[root@master141 pki]#  kubectl config set-cluster gshcmy-k8s \
  --certificate-authority=/gshcmy/certs/kubernetes/k8s-ca.pem \
  --embed-certs=true \
  --server=https://10.0.0.140:8443 \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-admin.kubeconfig
  
  
Set the user entry
[root@master141 pki]# kubectl config set-credentials kube-admin \
  --client-certificate=/gshcmy/certs/kubernetes/admin.pem \
  --client-key=/gshcmy/certs/kubernetes/admin-key.pem \
  --embed-certs=true \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-admin.kubeconfig
  
Set the context
[root@master141 pki]# kubectl config set-context kube-admin@kubernetes \
  --cluster=gshcmy-k8s \
  --user=kube-admin \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-admin.kubeconfig
  
Use the context as the default
[root@master141 pki]# kubectl config use-context kube-admin@kubernetes \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-admin.kubeconfig

Create the ServiceAccount key pair

ServiceAccount is a Kubernetes authentication mechanism: creating a ServiceAccount also creates a Secret bound to it, and that Secret carries a token.
[root@master141 pki]# openssl genrsa -out /gshcmy/certs/kubernetes/sa.key 2048


Derive sa.pub from sa.key
[root@master141 pki]# openssl rsa -in /gshcmy/certs/kubernetes/sa.key -pubout -out /gshcmy/certs/kubernetes/sa.pub

[root@master141 pki]# ll /gshcmy/certs/kubernetes/sa*
-rw------- 1 root root 1704 Dec 23 22:53 /gshcmy/certs/kubernetes/sa.key
-rw-r--r-- 1 root root  451 Dec 23 22:54 /gshcmy/certs/kubernetes/sa.pub
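
To verify the pair actually matches, compare the public key derived from sa.key against sa.pub (plain openssl, nothing cluster-specific):

diff <(openssl rsa -in /gshcmy/certs/kubernetes/sa.key -pubout 2>/dev/null) /gshcmy/certs/kubernetes/sa.pub && echo "sa key pair matches"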

Copy the Kubernetes component certificates from master141 to the other two master nodes

master141 copies the certificate and kubeconfig directories to the other two masters:
[root@master141 pki]# data_rsync.sh /gshcmy/certs/kubernetes m
===== rsyncing master142: kubernetes =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: kubernetes =====
root@master143's password: 
Command executed successfully!

[root@master141 pki]# data_rsync.sh /gshcmy/certs/kubeconfig m
===== rsyncing master142: kubeconfig =====
root@master142's password: 
Command executed successfully!
===== rsyncing master143: kubeconfig =====
root@master143's password: 
Command executed successfully!

Verify the file counts on the other two nodes:
[root@master142 ~]# ls /gshcmy/certs/kubernetes  | wc -l
23
[root@master142 ~]# ls /gshcmy/certs/kubeconfig | wc -l
3
[root@master143 ~]# ls /gshcmy/certs/kubernetes  | wc -l
23
[root@master143 ~]# ls /gshcmy/certs/kubeconfig | wc -l
3

Install the high-availability components: haproxy + keepalived

Install the HA components on all master nodes [master141-143]
Tips:
	- The HA components could be deployed on two dedicated VMs, but to save two machines they are colocated on the master nodes here.
	- When running Kubernetes on a public cloud there is no need to install them at all, since most public clouds do not support keepalived; use a cloud load balancer instead, e.g. Alibaba Cloud "SLB" or Tencent Cloud "ELB".
	- ELB is recommended: SLB has a loopback problem (servers behind the SLB cannot reach the SLB address themselves), although Tencent Cloud has fixed this.
On all masters:

apt-get -y install keepalived haproxy
Configure haproxy on all master nodes
Tips:
	- The haproxy load balancer listens on 8443 here; you can change it to another port. haproxy reverse-proxies the master components.
	- If you do change it, be sure to also update the kubeconfig files generated above, otherwise connecting to the cluster will fail.


Hands-on:
		2.1 Back up the configuration file
cp /etc/haproxy/haproxy.cfg{,`date +%F`}


		2.2 The configuration file content is identical on all nodes
cat > /etc/haproxy/haproxy.cfg << 'EOF'
global
  maxconn  2000
  ulimit-n  16384
  log  127.0.0.1 local0 err
  stats timeout 30s

defaults
  log global
  mode  http
  option  httplog
  timeout connect 5000
  timeout client  50000
  timeout server  50000
  timeout http-request 15s
  timeout http-keep-alive 15s

frontend monitor-haproxy
  bind *:9999
  mode http
  option httplog
  monitor-uri /ruok

frontend gshcmy-k8s
  bind 0.0.0.0:8443
  bind 127.0.0.1:8443
  mode tcp
  option tcplog
  tcp-request inspect-delay 5s
  default_backend gshcmy-k8s

backend gshcmy-k8s
  mode tcp
  option tcplog
  option tcp-check
  balance roundrobin
  server master141   10.0.0.141:6443 check inter 10s downinter 5s rise 2 fall 2 slowstart 60s maxconn 250 maxqueue 256 weight 100
  server master142   10.0.0.142:6443 check inter 10s downinter 5s rise 2 fall 2 slowstart 60s maxconn 250 maxqueue 256 weight 100
  server master143   10.0.0.143:6443 check inter 10s downinter 5s rise 2 fall 2 slowstart 60s maxconn 250 maxqueue 256 weight 100
EOF
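
Before starting the service, haproxy can validate the file itself; -c is haproxy's built-in configuration check mode:

haproxy -c -f /etc/haproxy/haproxy.cfg
# expected output: Configuration file is valid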

Configure keepalived on all master nodes
Tips:
	- The "interface" field must be your NIC name; if your NIC is ens33, change "eth0" to "ens33".
	- "mcast_src_ip" differs on each master node; adjust it to your environment.
	- "virtual_ipaddress" is the load balancer VIP, which must match the apiserver address in the kubeconfig files.
	- The "script" field points to a script that checks whether the backend apiserver is healthy.
	- "router_id" is the node IP; each master configures its own.

Create the configuration file on master141
[root@master141 ~]# ifconfig
eth0: flags=4163<UP,BROADCAST,RUNNING,MULTICAST>  mtu 1500
        inet 10.0.0.141  netmask 255.255.255.0  broadcast 10.0.0.255
        inet6 fe80::20c:29ff:feda:2a78  prefixlen 64  scopeid 0x20<link>
        ether 00:0c:29:da:2a:78  txqueuelen 1000  (Ethernet)
        RX packets 87124  bytes 14793699 (14.7 MB)
        RX errors 0  dropped 0  overruns 0  frame 0
        TX packets 87498  bytes 10987285 (10.9 MB)
        TX errors 0  dropped 0 overruns 0  carrier 0  collisions 0

[root@master141 ~]# cat > /etc/keepalived/keepalived.conf <<'EOF'
! Configuration File for keepalived
global_defs {
   router_id 10.0.0.141
}
vrrp_script chk_nginx {
    script "/etc/keepalived/check_port.sh 8443"
    interval 2
    weight -20
}
vrrp_instance VI_1 {
    state MASTER
    interface eth0
    virtual_router_id 251
    priority 100
    advert_int 1
    mcast_src_ip 10.0.0.141
    nopreempt
    authentication {
        auth_type PASS
        auth_pass gshcmy_k8s
    }
    track_script {
         chk_nginx
    }
    virtual_ipaddress {
        10.0.0.140
    }
}
EOF

Create the configuration file on master142
[root@master142 ~]#  ifconfig
eth0: flags=4163<UP,BROADCAST,RUNNING,MULTICAST>  mtu 1500
        inet 10.0.0.142  netmask 255.255.255.0  broadcast 10.0.0.255
        inet6 fe80::20c:29ff:feb2:8da0  prefixlen 64  scopeid 0x20<link>
        ether 00:0c:29:b2:8d:a0  txqueuelen 1000  (Ethernet)
        RX packets 67794  bytes 12957944 (12.9 MB)
        RX errors 0  dropped 0  overruns 0  frame 0
        TX packets 67085  bytes 9454780 (9.4 MB)
        TX errors 0  dropped 0 overruns 0  carrier 0  collisions 0

[root@master142 ~]# cat > /etc/keepalived/keepalived.conf <<EOF
! Configuration File for keepalived
global_defs {
   router_id 10.0.0.142
}
vrrp_script chk_nginx {
    script "/etc/keepalived/check_port.sh 8443"
    interval 2
    weight -20
}
vrrp_instance VI_1 {
    state MASTER
    interface eth0
    virtual_router_id 251
    priority 100
    advert_int 1
    mcast_src_ip 10.0.0.142
    nopreempt
    authentication {
        auth_type PASS
        auth_pass gshcmy_k8s
    }
    track_script {
         chk_nginx
    }
    virtual_ipaddress {
        10.0.0.140
    }
}
EOF

Create the configuration file on master143
[root@master143 ~]# ifconfig
eth0: flags=4163<UP,BROADCAST,RUNNING,MULTICAST>  mtu 1500
        inet 10.0.0.143  netmask 255.255.255.0  broadcast 10.0.0.255
        inet6 fe80::20c:29ff:fe55:5971  prefixlen 64  scopeid 0x20<link>
        ether 00:0c:29:55:59:71  txqueuelen 1000  (Ethernet)
        RX packets 76007  bytes 14125808 (14.1 MB)
        RX errors 0  dropped 0  overruns 0  frame 0
        TX packets 75099  bytes 10609607 (10.6 MB)
        TX errors 0  dropped 0 overruns 0  carrier 0  collisions 0

[root@master143 ~]# cat > /etc/keepalived/keepalived.conf <<EOF
! Configuration File for keepalived
global_defs {
   router_id 10.0.0.143
}
vrrp_script chk_nginx {
    script "/etc/keepalived/check_port.sh 8443"
    interval 2
    weight -20
}
vrrp_instance VI_1 {
    state MASTER
    interface eth0
    virtual_router_id 251
    priority 100
    advert_int 1
    mcast_src_ip 10.0.0.143
    nopreempt
    authentication {
        auth_type PASS
        auth_pass gshcmy_k8s
    }
    track_script {
         chk_nginx
    }
    virtual_ipaddress {
        10.0.0.140
    }
}
EOF

Create the health-check script on all keepalived nodes (141-143):
cat > /etc/keepalived/check_port.sh <<'EOF'
#!/bin/bash
CHK_PORT=$1
if [ -n "$CHK_PORT" ];then
    PORT_PROCESS=`ss -lt|grep $CHK_PORT|wc -l`
    if [ $PORT_PROCESS -eq 0 ];then
        echo "Port $CHK_PORT Is Not Used,End."
        systemctl stop keepalived
    fi
else
    echo "Check Port Cant Be Empty!"
fi
EOF

Make it executable (141-143):
chmod +x /etc/keepalived/check_port.sh
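
The script can be exercised by hand before keepalived starts using it; with nothing listening on 8443 yet it will stop keepalived, and once haproxy is up it stays silent:

bash /etc/keepalived/check_port.sh 8443
bash /etc/keepalived/check_port.sh          # prints "Check Port Cant Be Empty!"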

Start and verify the keepalived service

Start keepalived:
systemctl daemon-reload
systemctl enable --now keepalived
systemctl status keepalived

Verify the service

On all masters (141-143):
tee -a /etc/sysctl.conf << EOF
net.ipv6.conf.eth0.disable_ipv6 = 1
net.ipv6.conf.all.disable_ipv6 = 1
net.ipv6.conf.default.disable_ipv6 = 1
EOF

sysctl -p

[root@master(141-143) ~]# ip a
1: lo: <LOOPBACK,UP,LOWER_UP> mtu 65536 qdisc noqueue state UNKNOWN group default qlen 1000
    link/loopback 00:00:00:00:00:00 brd 00:00:00:00:00:00
    inet 127.0.0.1/8 scope host lo
       valid_lft forever preferred_lft forever
2: eth0: <BROADCAST,MULTICAST,UP,LOWER_UP> mtu 1500 qdisc fq_codel state UP group default qlen 1000
    link/ether 00:0c:29:da:2a:78 brd ff:ff:ff:ff:ff:ff
    altname enp2s1
    altname ens33
    inet 10.0.0.141/24 brd 10.0.0.255 scope global eth0
       valid_lft forever preferred_lft forever
    inet 10.0.0.140/32 scope global eth0
       valid_lft forever preferred_lft forever
3: tunl0@NONE: <NOARP> mtu 1480 qdisc noop state DOWN group default qlen 1000
    link/ipip 0.0.0.0 brd 0.0.0.0

[root@master141 ~]# ping 10.0.0.140
PING 10.0.0.140 (10.0.0.140) 56(84) bytes of data.
64 bytes from 10.0.0.140: icmp_seq=1 ttl=64 time=0.016 ms
64 bytes from 10.0.0.140: icmp_seq=2 ttl=64 time=0.029 ms

Stop keepalived on one node

[root@master141 ~]# systemctl stop keepalived

[root@master141 ~]# ping 10.0.0.140
PING 10.0.0.140 (10.0.0.140) 56(84) bytes of data.
64 bytes from 10.0.0.140: icmp_seq=1 ttl=64 time=0.697 ms
64 bytes from 10.0.0.140: icmp_seq=2 ttl=64 time=0.529 ms
64 bytes from 10.0.0.140: icmp_seq=3 ttl=64 time=0.504 ms
64 bytes from 10.0.0.140: icmp_seq=4 ttl=64 time=0.338 ms


[root@master141 ~]# ip a
1: lo: <LOOPBACK,UP,LOWER_UP> mtu 65536 qdisc noqueue state UNKNOWN group default qlen 1000
    link/loopback 00:00:00:00:00:00 brd 00:00:00:00:00:00
    inet 127.0.0.1/8 scope host lo
       valid_lft forever preferred_lft forever
2: eth0: <BROADCAST,MULTICAST,UP,LOWER_UP> mtu 1500 qdisc fq_codel state UP group default qlen 1000
    link/ether 00:0c:29:da:2a:78 brd ff:ff:ff:ff:ff:ff
    altname enp2s1
    altname ens33
    inet 10.0.0.141/24 brd 10.0.0.255 scope global eth0
       valid_lft forever preferred_lft forever
3: tunl0@NONE: <NOARP> mtu 1480 qdisc noop state DOWN group default qlen 1000
    link/ipip 0.0.0.0 brd 0.0.0.0

Verify that the VIP failed over to another node; sure enough, it drifted to another master:
[root@master143 ~]# ip a
1: lo: <LOOPBACK,UP,LOWER_UP> mtu 65536 qdisc noqueue state UNKNOWN group default qlen 1000
    link/loopback 00:00:00:00:00:00 brd 00:00:00:00:00:00
    inet 127.0.0.1/8 scope host lo
       valid_lft forever preferred_lft forever
2: eth0: <BROADCAST,MULTICAST,UP,LOWER_UP> mtu 1500 qdisc fq_codel state UP group default qlen 1000
    link/ether 00:0c:29:55:59:71 brd ff:ff:ff:ff:ff:ff
    altname enp2s1
    altname ens33
    inet 10.0.0.143/24 brd 10.0.0.255 scope global eth0
       valid_lft forever preferred_lft forever
    inet 10.0.0.140/32 scope global eth0
       valid_lft forever preferred_lft forever
3: tunl0@NONE: <NOARP> mtu 1480 qdisc noop state DOWN group default qlen 1000
    link/ipip 0.0.0.0 brd 0.0.0.0

Start and verify the haproxy service

Start haproxy on all nodes:
systemctl enable --now haproxy 
systemctl restart haproxy 
systemctl status haproxy 

Start keepalived on all nodes:
systemctl start keepalived

Verify haproxy with telnet:
[root@master142 ~]# telnet 10.0.0.140 8443

Because keepalived on 141 was just stopped and restarted, clear the stale ARP entry for the VIP first:
[root@master141 ~]# ip neigh del 10.0.0.140 dev eth0
[root@master141 ~]# arp -an | grep "10.0.0.140"
[root@master141 ~]# arping -c 2 -I eth0 10.0.0.140
Command 'arping' not found, but can be installed with:
apt install iputils-arping  # version 3:20211215-1ubuntu0.1, or
apt install arping          # version 2.22-1
[root@master141 ~]# arp -an | grep "10.0.0.140"
[root@master141 ~]# telnet 10.0.0.140 8443
Trying 10.0.0.140...
Connected to 10.0.0.140.
Escape character is '^]'.
Connection closed by foreign host.

Verify via the monitor web endpoint:
[root@master141 ~]# curl http://10.0.0.140:9999/ruok
<html><body><h1>200 OK</h1>
Service ready.
</body></html>
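
The same monitor endpoint is served by every master, so one loop checks all three haproxy instances at once:

for ip in 10.0.0.141 10.0.0.142 10.0.0.143; do
  echo "--- $ip ---"
  curl -s http://$ip:9999/ruok
done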

Deploy the kube-apiserver component

- "--advertise-address" is the IP address of the corresponding master node;
	- "--service-cluster-ip-range" is the Service CIDR;
	- "--service-node-port-range" is the NodePort port range for Services;
	- "--etcd-servers" lists the etcd cluster endpoints.

Configuration reference:
	https://kubernetes.io/zh-cn/docs/reference/command-line-tools-reference/kube-apiserver/

master141 node

Create the kube-apiserver unit file on master141:
cat > /usr/lib/systemd/system/kube-apiserver.service << 'EOF'
[Unit]
Description=gshcmy's Kubernetes API Server
Documentation=https://github.com/kubernetes/kubernetes
After=network.target

[Service]
ExecStart=/usr/local/bin/kube-apiserver \
      --v=2  \
      --bind-address=0.0.0.0  \
      --secure-port=6443  \
      --allow-privileged=true \
      --advertise-address=10.0.0.141 \
      --service-cluster-ip-range=10.200.0.0/16  \
      --service-node-port-range=3000-50000  \
      --etcd-servers=https://10.0.0.141:2379,https://10.0.0.142:2379,https://10.0.0.143:2379 \
      --etcd-cafile=/gshcmy/certs/etcd/etcd-ca.pem  \
      --etcd-certfile=/gshcmy/certs/etcd/etcd-server.pem  \
      --etcd-keyfile=/gshcmy/certs/etcd/etcd-server-key.pem  \
      --client-ca-file=/gshcmy/certs/kubernetes/k8s-ca.pem  \
      --tls-cert-file=/gshcmy/certs/kubernetes/apiserver.pem  \
      --tls-private-key-file=/gshcmy/certs/kubernetes/apiserver-key.pem  \
      --kubelet-client-certificate=/gshcmy/certs/kubernetes/apiserver.pem  \
      --kubelet-client-key=/gshcmy/certs/kubernetes/apiserver-key.pem  \
      --service-account-key-file=/gshcmy/certs/kubernetes/sa.pub  \
      --service-account-signing-key-file=/gshcmy/certs/kubernetes/sa.key \
      --service-account-issuer=https://kubernetes.default.svc.gshcmy.com \
      --kubelet-preferred-address-types=InternalIP,ExternalIP,Hostname  \
      --enable-admission-plugins=NamespaceLifecycle,LimitRanger,ServiceAccount,DefaultStorageClass,DefaultTolerationSeconds,NodeRestriction,ResourceQuota  \
      --authorization-mode=Node,RBAC  \
      --enable-bootstrap-token-auth=true  \
      --requestheader-client-ca-file=/gshcmy/certs/kubernetes/front-proxy-ca.pem  \
      --proxy-client-cert-file=/gshcmy/certs/kubernetes/front-proxy-client.pem  \
      --proxy-client-key-file=/gshcmy/certs/kubernetes/front-proxy-client-key.pem  \
      --requestheader-allowed-names=aggregator  \
      --requestheader-group-headers=X-Remote-Group  \
      --requestheader-extra-headers-prefix=X-Remote-Extra-  \
      --requestheader-username-headers=X-Remote-User

Restart=on-failure
RestartSec=10s
LimitNOFILE=65535

[Install]
WantedBy=multi-user.target
EOF

Start the service
[root@master141 ~]# systemctl daemon-reload && systemctl enable --now kube-apiserver
[root@master141 ~]# systemctl status kube-apiserver
[root@master141 ~]# ss -ntl | grep 6443
LISTEN 0      16384              *:6443             *:*     
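
The apiserver's /healthz endpoint is readable without credentials thanks to the default system:public-info-viewer binding, so a quick curl works as a liveness check (-k skips certificate verification):

curl -k https://10.0.0.141:6443/healthz && echo         # direct to the apiserver
curl -k https://10.0.0.140:8443/healthz && echo         # through the haproxy VIP, once a backend is marked up
# both should print: ok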

master142 node

Create the kube-apiserver unit file on master142:
cat > /usr/lib/systemd/system/kube-apiserver.service << 'EOF'
[Unit]
Description=gshcmy's Kubernetes API Server
Documentation=https://github.com/kubernetes/kubernetes
After=network.target

[Service]
ExecStart=/usr/local/bin/kube-apiserver \
      --v=2  \
      --bind-address=0.0.0.0  \
      --secure-port=6443  \
      --allow-privileged=true \
      --advertise-address=10.0.0.142 \
      --service-cluster-ip-range=10.200.0.0/16  \
      --service-node-port-range=3000-50000  \
      --etcd-servers=https://10.0.0.141:2379,https://10.0.0.142:2379,https://10.0.0.143:2379 \
      --etcd-cafile=/gshcmy/certs/etcd/etcd-ca.pem  \
      --etcd-certfile=/gshcmy/certs/etcd/etcd-server.pem  \
      --etcd-keyfile=/gshcmy/certs/etcd/etcd-server-key.pem  \
      --client-ca-file=/gshcmy/certs/kubernetes/k8s-ca.pem  \
      --tls-cert-file=/gshcmy/certs/kubernetes/apiserver.pem  \
      --tls-private-key-file=/gshcmy/certs/kubernetes/apiserver-key.pem  \
      --kubelet-client-certificate=/gshcmy/certs/kubernetes/apiserver.pem  \
      --kubelet-client-key=/gshcmy/certs/kubernetes/apiserver-key.pem  \
      --service-account-key-file=/gshcmy/certs/kubernetes/sa.pub  \
      --service-account-signing-key-file=/gshcmy/certs/kubernetes/sa.key \
      --service-account-issuer=https://kubernetes.default.svc.gshcmy.com \
      --kubelet-preferred-address-types=InternalIP,ExternalIP,Hostname  \
      --enable-admission-plugins=NamespaceLifecycle,LimitRanger,ServiceAccount,DefaultStorageClass,DefaultTolerationSeconds,NodeRestriction,ResourceQuota  \
      --authorization-mode=Node,RBAC  \
      --enable-bootstrap-token-auth=true  \
      --requestheader-client-ca-file=/gshcmy/certs/kubernetes/front-proxy-ca.pem  \
      --proxy-client-cert-file=/gshcmy/certs/kubernetes/front-proxy-client.pem  \
      --proxy-client-key-file=/gshcmy/certs/kubernetes/front-proxy-client-key.pem  \
      --requestheader-allowed-names=aggregator  \
      --requestheader-group-headers=X-Remote-Group  \
      --requestheader-extra-headers-prefix=X-Remote-Extra-  \
      --requestheader-username-headers=X-Remote-User

Restart=on-failure
RestartSec=10s
LimitNOFILE=65535

[Install]
WantedBy=multi-user.target
EOF

Start the service
[root@master142 ~]# systemctl daemon-reload && systemctl enable --now kube-apiserver
[root@master142 ~]# systemctl status kube-apiserver
[root@master142 ~]# ss -ntl | grep 6443
LISTEN 0      16384              *:6443             *:*  

master143 node

Create the kube-apiserver unit file on master143:
cat > /usr/lib/systemd/system/kube-apiserver.service << 'EOF'
[Unit]
Description=gshcmy's Kubernetes API Server
Documentation=https://github.com/kubernetes/kubernetes
After=network.target

[Service]
ExecStart=/usr/local/bin/kube-apiserver \
      --v=2  \
      --bind-address=0.0.0.0  \
      --secure-port=6443  \
      --allow-privileged=true \
      --advertise-address=10.0.0.143 \
      --service-cluster-ip-range=10.200.0.0/16  \
      --service-node-port-range=3000-50000  \
      --etcd-servers=https://10.0.0.141:2379,https://10.0.0.142:2379,https://10.0.0.143:2379 \
      --etcd-cafile=/gshcmy/certs/etcd/etcd-ca.pem  \
      --etcd-certfile=/gshcmy/certs/etcd/etcd-server.pem  \
      --etcd-keyfile=/gshcmy/certs/etcd/etcd-server-key.pem  \
      --client-ca-file=/gshcmy/certs/kubernetes/k8s-ca.pem  \
      --tls-cert-file=/gshcmy/certs/kubernetes/apiserver.pem  \
      --tls-private-key-file=/gshcmy/certs/kubernetes/apiserver-key.pem  \
      --kubelet-client-certificate=/gshcmy/certs/kubernetes/apiserver.pem  \
      --kubelet-client-key=/gshcmy/certs/kubernetes/apiserver-key.pem  \
      --service-account-key-file=/gshcmy/certs/kubernetes/sa.pub  \
      --service-account-signing-key-file=/gshcmy/certs/kubernetes/sa.key \
      --service-account-issuer=https://kubernetes.default.svc.gshcmy.com \
      --kubelet-preferred-address-types=InternalIP,ExternalIP,Hostname  \
      --enable-admission-plugins=NamespaceLifecycle,LimitRanger,ServiceAccount,DefaultStorageClass,DefaultTolerationSeconds,NodeRestriction,ResourceQuota  \
      --authorization-mode=Node,RBAC  \
      --enable-bootstrap-token-auth=true  \
      --requestheader-client-ca-file=/gshcmy/certs/kubernetes/front-proxy-ca.pem  \
      --proxy-client-cert-file=/gshcmy/certs/kubernetes/front-proxy-client.pem  \
      --proxy-client-key-file=/gshcmy/certs/kubernetes/front-proxy-client-key.pem  \
      --requestheader-allowed-names=aggregator  \
      --requestheader-group-headers=X-Remote-Group  \
      --requestheader-extra-headers-prefix=X-Remote-Extra-  \
      --requestheader-username-headers=X-Remote-User

Restart=on-failure
RestartSec=10s
LimitNOFILE=65535

[Install]
WantedBy=multi-user.target
EOF

Start the service
[root@master143 ~]# systemctl daemon-reload && systemctl enable --now kube-apiserver
[root@master143 ~]# systemctl status kube-apiserver
[root@master143 ~]# ss -ntl | grep 6443
LISTEN 0      16384              *:6443             *:*

Deploy the kube-controller-manager component

Create the unit file on all master nodes
Tip:
	- "--cluster-cidr" is the Pod CIDR; adjust it as needed.

Configuration reference:
	https://kubernetes.io/zh-cn/docs/reference/command-line-tools-reference/kube-controller-manager/
The controller-manager unit file is identical on all nodes (provided the certificate paths are also identical!)
cat > /usr/lib/systemd/system/kube-controller-manager.service << 'EOF'
[Unit]
Description=gshcmy's Kubernetes Controller Manager
Documentation=https://github.com/kubernetes/kubernetes
After=network.target

[Service]
ExecStart=/usr/local/bin/kube-controller-manager \
      --v=2 \
      --root-ca-file=/gshcmy/certs/kubernetes/k8s-ca.pem \
      --cluster-signing-cert-file=/gshcmy/certs/kubernetes/k8s-ca.pem \
      --cluster-signing-key-file=/gshcmy/certs/kubernetes/k8s-ca-key.pem \
      --service-account-private-key-file=/gshcmy/certs/kubernetes/sa.key \
      --kubeconfig=/gshcmy/certs/kubeconfig/kube-controller-manager.kubeconfig \
      --leader-elect=true \
      --use-service-account-credentials=true \
      --node-monitor-grace-period=40s \
      --node-monitor-period=5s \
      --controllers=*,bootstrapsigner,tokencleaner \
      --allocate-node-cidrs=true \
      --cluster-cidr=10.100.0.0/16 \
      --requestheader-client-ca-file=/gshcmy/certs/kubernetes/front-proxy-ca.pem \
      --node-cidr-mask-size=24

Restart=always
RestartSec=10s

[Install]
WantedBy=multi-user.target
EOF

Start the controller-manager service:
systemctl daemon-reload
systemctl enable --now kube-controller-manager
systemctl  status kube-controller-manager
ss -ntl | grep 10257
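
kube-controller-manager serves a secure port on 10257 and by default allows unauthenticated access to /healthz (via --authorization-always-allow-paths), so a local curl is a handy extra check:

curl -sk https://127.0.0.1:10257/healthz && echo
# expected output: ok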

Deploy the kube-scheduler component

Configuration reference:
	https://kubernetes.io/zh-cn/docs/reference/command-line-tools-reference/kube-scheduler/
Create the unit file on all master nodes
The scheduler unit file is identical on all nodes (provided the certificate paths are also identical)
cat > /usr/lib/systemd/system/kube-scheduler.service <<'EOF'
[Unit]
Description=gshcmy's Kubernetes Scheduler
Documentation=https://github.com/kubernetes/kubernetes
After=network.target

[Service]
ExecStart=/usr/local/bin/kube-scheduler \
      --v=2 \
      --leader-elect=true \
      --kubeconfig=/gshcmy/certs/kubeconfig/kube-scheduler.kubeconfig

Restart=always
RestartSec=10s

[Install]
WantedBy=multi-user.target
EOF

Start the scheduler service:
systemctl daemon-reload
systemctl enable --now kube-scheduler
systemctl  status kube-scheduler
ss -ntl | grep 10259
LISTEN 0      16384              *:10259            *:*

Create the Bootstrapping configuration for automatic kubelet certificate issuance

Create the bootstrap-kubelet.kubeconfig file on master141
Tips:
	- "--server" points to the load balancer IP; the load balancer reverse-proxies the master nodes.
	- "--token" can be customized, but the "token-id" and "token-secret" of the "bootstrap" Secret must be changed to match; note that bootstrap tokens are expected to match [a-z0-9]{6}.[a-z0-9]{16}, so a 6-character secret like the one used below may be rejected by the bootstrap authenticator.
Set the cluster entry on master141:

kubectl config set-cluster gshcmy-k8s \
  --certificate-authority=/gshcmy/certs/kubernetes/k8s-ca.pem \
  --embed-certs=true \
  --server=https://10.0.0.140:8443 \
  --kubeconfig=/gshcmy/certs/kubeconfig/bootstrap-kubelet.kubeconfig

Set the user entry:
kubectl config set-credentials tls-bootstrap-token-user  \
  --token=gshcmy.gshcmy \
  --kubeconfig=/gshcmy/certs/kubeconfig/bootstrap-kubelet.kubeconfig

Bind the cluster and the user in a context:
kubectl config set-context tls-bootstrap-token-user@kubernetes \
  --cluster=gshcmy-k8s \
  --user=tls-bootstrap-token-user \
  --kubeconfig=/gshcmy/certs/kubeconfig/bootstrap-kubelet.kubeconfig

Use the context as the default:
kubectl config use-context tls-bootstrap-token-user@kubernetes \
  --kubeconfig=/gshcmy/certs/kubeconfig/bootstrap-kubelet.kubeconfig

Copy the admin kubeconfig on all master nodes

All masters copy the administrator kubeconfig:
[root@master141-143 ~]# mkdir -p /root/.kube
[root@master141-143 ~]# cp /gshcmy/certs/kubeconfig/kube-admin.kubeconfig /root/.kube/config
[root@master141-143~]# kubectl get cs
Warning: v1 ComponentStatus is deprecated in v1.19+
NAME                 STATUS    MESSAGE   ERROR
controller-manager   Healthy   ok        
etcd-0               Healthy   ok        
scheduler            Healthy   ok

Check the cluster status; even if the cs (ComponentStatus) API is removed in a future release, the "cluster-info" subcommand can be used to check the cluster instead.
[root@master141 ~]# kubectl cluster-info
Kubernetes control plane is running at https://10.0.0.140:8443

To further debug and diagnose cluster problems, use 'kubectl cluster-info dump'.

Create the bootstrap-secret authorization

Create the bootstrap-secret manifest used for authorization:
cat > bootstrap-secret.yaml <<EOF
apiVersion: v1
kind: Secret
metadata:
  name: bootstrap-token-gshcmy
  namespace: kube-system
type: bootstrap.kubernetes.io/token
stringData:
  description: "The default bootstrap token generated by 'kubelet '."
  token-id: gshcmy
  token-secret: gshcmy
  usage-bootstrap-authentication: "true"
  usage-bootstrap-signing: "true"
  auth-extra-groups:  system:bootstrappers:default-node-token,system:bootstrappers:worker,system:bootstrappers:ingress
 
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
  name: kubelet-bootstrap
roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: ClusterRole
  name: system:node-bootstrapper
subjects:
- apiGroup: rbac.authorization.k8s.io
  kind: Group
  name: system:bootstrappers:default-node-token
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
  name: node-autoapprove-bootstrap
roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: ClusterRole
  name: system:certificates.k8s.io:certificatesigningrequests:nodeclient
subjects:
- apiGroup: rbac.authorization.k8s.io
  kind: Group
  name: system:bootstrappers:default-node-token
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
  name: node-autoapprove-certificate-rotation
roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: ClusterRole
  name: system:certificates.k8s.io:certificatesigningrequests:selfnodeclient
subjects:
- apiGroup: rbac.authorization.k8s.io
  kind: Group
  name: system:nodes
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRole
metadata:
  annotations:
    rbac.authorization.kubernetes.io/autoupdate: "true"
  labels:
    kubernetes.io/bootstrapping: rbac-defaults
  name: system:kube-apiserver-to-kubelet
rules:
  - apiGroups:
      - ""
    resources:
      - nodes/proxy
      - nodes/stats
      - nodes/log
      - nodes/spec
      - nodes/metrics
    verbs:
      - "*"
---
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
  name: system:kube-apiserver
  namespace: ""
roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: ClusterRole
  name: system:kube-apiserver-to-kubelet
subjects:
  - apiGroup: rbac.authorization.k8s.io
    kind: User
    name: kube-apiserver
EOF

Apply the bootstrap-secret manifest:
[root@master141 ~]# kubectl apply -f bootstrap-secret.yaml
secret/bootstrap-token-gshcmy created
clusterrolebinding.rbac.authorization.k8s.io/kubelet-bootstrap created
clusterrolebinding.rbac.authorization.k8s.io/node-autoapprove-bootstrap created
clusterrolebinding.rbac.authorization.k8s.io/node-autoapprove-certificate-rotation created
clusterrole.rbac.authorization.k8s.io/system:kube-apiserver-to-kubelet created
clusterrolebinding.rbac.authorization.k8s.io/system:kube-apiserver created

Deploy the worker nodes: starting kubelet

Copy the certificates

master141 distributes the certificates to the other nodes:
[root@master141 ~]# cd /gshcmy/certs/
for NODE in master142 master143 worker144 worker145; do
     echo $NODE
     ssh $NODE "mkdir -p /gshcmy/certs/kube{config,rnetes}"
     for FILE in k8s-ca.pem k8s-ca-key.pem front-proxy-ca.pem; do
       scp kubernetes/$FILE $NODE:/gshcmy/certs/kubernetes/${FILE}
         done
     scp kubeconfig/bootstrap-kubelet.kubeconfig $NODE:/gshcmy/certs/kubeconfig/
done

Verify on a worker node

[root@worker145 certs]# ll /gshcmy/ -R
/gshcmy/:
total 12
drwxr-xr-x  3 root root 4096 Dec 23 20:56 ./
drwxr-xr-x 21 root root 4096 Dec 23 20:56 ../
drwxr-xr-x  4 root root 4096 Dec 24 21:38 certs/

/gshcmy/certs:
total 16
drwxr-xr-x 4 root root 4096 Dec 24 21:38 ./
drwxr-xr-x 3 root root 4096 Dec 23 20:56 ../
drwxr-xr-x 2 root root 4096 Dec 24 21:40 kubeconfig/
drwxr-xr-x 2 root root 4096 Dec 24 21:40 kubernetes/

/gshcmy/certs/kubeconfig:
total 12
drwxr-xr-x 2 root root 4096 Dec 24 21:40 ./
drwxr-xr-x 4 root root 4096 Dec 24 21:38 ../
-rw------- 1 root root 2223 Dec 24 21:40 bootstrap-kubelet.kubeconfig

/gshcmy/certs/kubernetes:
total 20
drwxr-xr-x 2 root root 4096 Dec 24 21:40 ./
drwxr-xr-x 4 root root 4096 Dec 24 21:38 ../
-rw-r--r-- 1 root root 1094 Dec 24 21:40 front-proxy-ca.pem
-rw------- 1 root root 1679 Dec 24 21:40 k8s-ca-key.pem
-rw-r--r-- 1 root root 1363 Dec 24 21:40 k8s-ca.pem
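Besides listing the files, a quick integrity check is to compare checksums against master141 (a minimal sketch reusing the node list from the copy loop):

# Run on master141: every node should print the same hash
md5sum /gshcmy/certs/kubernetes/k8s-ca.pem
for NODE in master142 master143 worker144 worker145; do
    ssh $NODE "md5sum /gshcmy/certs/kubernetes/k8s-ca.pem"
done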

Start the kubelet service

- The "kubelet.kubeconfig" file that "--kubeconfig" points to in "10-kubelet.conf" does not exist yet; it is generated automatically during TLS bootstrapping.
	- "clusterDNS" is the cluster DNS address, which we can customize, e.g. "10.200.0.254" (matching the kubelet-conf.yml below).
	- "clusterDomain" is the cluster domain name and must stay consistent with our cluster design, e.g. "gshcmy.com".
	- "ExecStart=" must be written twice in "10-kubelet.conf" (the first, empty entry clears the unit's default); otherwise kubelet may fail to start.
Create the working directories on all nodes (master and worker)
mkdir -p /var/lib/kubelet /var/log/kubernetes /etc/systemd/system/kubelet.service.d /etc/kubernetes/manifests/


cat > /etc/kubernetes/kubelet-conf.yml <<'EOF'
apiVersion: kubelet.config.k8s.io/v1beta1
kind: KubeletConfiguration
address: 0.0.0.0
port: 10250
readOnlyPort: 10255
authentication:
  anonymous:
    enabled: false
  webhook:
    cacheTTL: 2m0s
    enabled: true
  x509:
    clientCAFile: /gshcmy/certs/kubernetes/k8s-ca.pem
authorization:
  mode: Webhook
  webhook:
    cacheAuthorizedTTL: 5m0s
    cacheUnauthorizedTTL: 30s
cgroupDriver: systemd
cgroupsPerQOS: true
clusterDNS:
- 10.200.0.254
clusterDomain: gshcmy.com
containerLogMaxFiles: 5
containerLogMaxSize: 10Mi
contentType: application/vnd.kubernetes.protobuf
cpuCFSQuota: true
cpuManagerPolicy: none
cpuManagerReconcilePeriod: 10s
enableControllerAttachDetach: true
enableDebuggingHandlers: true
enforceNodeAllocatable:
- pods
eventBurst: 10
eventRecordQPS: 5
evictionHard:
  imagefs.available: 15%
  memory.available: 100Mi
  nodefs.available: 10%
  nodefs.inodesFree: 5%
evictionPressureTransitionPeriod: 5m0s
failSwapOn: true
fileCheckFrequency: 20s
hairpinMode: promiscuous-bridge
healthzBindAddress: 127.0.0.1
healthzPort: 10248
httpCheckFrequency: 20s
imageGCHighThresholdPercent: 85
imageGCLowThresholdPercent: 80
imageMinimumGCAge: 2m0s
iptablesDropBit: 15
iptablesMasqueradeBit: 14
kubeAPIBurst: 10
kubeAPIQPS: 5
makeIPTablesUtilChains: true
maxOpenFiles: 1000000
maxPods: 110
nodeStatusUpdateFrequency: 10s
oomScoreAdj: -999
podPidsLimit: -1
registryBurst: 10
registryPullQPS: 5
resolvConf: /etc/resolv.conf
rotateCertificates: true
runtimeRequestTimeout: 2m0s
serializeImagePulls: true
staticPodPath: /etc/kubernetes/manifests
streamingConnectionIdleTimeout: 4h0m0s
syncFrequency: 1m0s
volumeStatsAggPeriod: 1m0s
EOF
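Since kubelet is configured with "cgroupDriver: systemd", the container runtime must use the same driver. A quick check, assuming containerd with its default config path:

# Expect: SystemdCgroup = true (in the runc runtime options)
grep -n 'SystemdCgroup' /etc/containerd/config.toml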

Configure the kubelet service unit on all nodes
cat >  /usr/lib/systemd/system/kubelet.service <<'EOF'
[Unit]
Description=gshcmy's Kubernetes Kubelet
Documentation=https://github.com/kubernetes/kubernetes
After=containerd.service
Requires=containerd.service

[Service]
ExecStart=/usr/local/bin/kubelet
Restart=always
StartLimitInterval=0
RestartSec=10

[Install]
WantedBy=multi-user.target
EOF

Configure the kubelet service drop-in file on all nodes
cat > /etc/systemd/system/kubelet.service.d/10-kubelet.conf <<'EOF'
[Service]
Environment="KUBELET_KUBECONFIG_ARGS=--bootstrap-kubeconfig=/gshcmy/certs/kubeconfig/bootstrap-kubelet.kubeconfig --kubeconfig=/gshcmy/certs/kubeconfig/kubelet.kubeconfig"
Environment="KUBELET_CONFIG_ARGS=--config=/etc/kubernetes/kubelet-conf.yml"
Environment="KUBELET_SYSTEM_ARGS=--container-runtime-endpoint=unix:///run/containerd/containerd.sock"
Environment="KUBELET_EXTRA_ARGS=--node-labels=node.kubernetes.io/node='' "
ExecStart=
ExecStart=/usr/local/bin/kubelet $KUBELET_KUBECONFIG_ARGS $KUBELET_CONFIG_ARGS $KUBELET_SYSTEM_ARGS $KUBELET_EXTRA_ARGS
EOF
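To confirm systemd will merge the drop-in with the unit (both ExecStart lines should appear, the empty one first):

# Show the unit file together with its drop-ins
systemctl cat kubelet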

Start kubelet on all nodes
systemctl daemon-reload
systemctl enable --now kubelet
systemctl status kubelet
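Once kubelet is up, it submits a CSR that the auto-approve bindings created earlier should sign, and the node registers itself. Nodes will show NotReady until a network plugin is deployed:

# Run on master141: CSRs should show Approved,Issued
kubectl get csr
kubectl get nodes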

Troubleshooting

If you see an error like:
nodes is forbidden: User \"system:anonymous\" cannot create resource \"nodes\" in API group \"\" at the cluster scope" node="k8s-master141"


Workaround (note: this binds system:anonymous to cluster-admin, which is wide open and acceptable only in a lab; the root cause is usually a broken bootstrap token or kubeconfig):
[root@master143 ~]# cat test-rbac.yaml
apiVersion: rbac.authorization.k8s.io/v1
kind: ClusterRoleBinding
metadata:
  name: gshcmy-kubelet-rbac
roleRef:
  apiGroup: rbac.authorization.k8s.io
  kind: ClusterRole
  name: cluster-admin
subjects:
- apiGroup: rbac.authorization.k8s.io
  kind: User
  name: system:anonymous
[root@master143 ~]# 
[root@master143 ~]# kubectl apply -f test-rbac.yaml
clusterrolebinding.rbac.authorization.k8s.io/gshcmy-kubelet-rbac created
[root@master143 ~]# 
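Once the nodes bootstrap successfully, remove this temporary binding again:

# Delete the overly permissive workaround binding
kubectl delete clusterrolebinding gshcmy-kubelet-rbac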

Deploying worker nodes: the kube-proxy service

Create the CSR request file for kube-proxy
[root@master141 pki]# cat > kube-proxy-csr.json  <<EOF
{
  "CN": "system:kube-proxy",
  "key": {
    "algo": "rsa",
    "size": 2048
  },
  "names": [
    {
      "C": "CN",
      "ST": "Beijing",
      "L": "Beijing",
      "O": "system:kube-proxy",
      "OU": "Kubernetes-manual"
    }
  ]
}
EOF

Generate the certificates kube-proxy needs
[root@master141 pki]# cfssl gencert \
  -ca=/gshcmy/certs/kubernetes/k8s-ca.pem \
  -ca-key=/gshcmy/certs/kubernetes/k8s-ca-key.pem \
  -config=k8s-ca-config.json \
  -profile=kubernetes \
  kube-proxy-csr.json | cfssljson -bare /gshcmy/certs/kubernetes/kube-proxy

[root@master141 pki]# ll /gshcmy/certs/kubernetes/kube-proxy*
-rw-r--r-- 1 root root 1045 Dec 24 22:45 /gshcmy/certs/kubernetes/kube-proxy.csr
-rw------- 1 root root 1679 Dec 24 22:45 /gshcmy/certs/kubernetes/kube-proxy-key.pem
-rw-r--r-- 1 root root 1464 Dec 24 22:45 /gshcmy/certs/kubernetes/kube-proxy.pem
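To verify the certificate carries the identity kube-proxy will authenticate as:

# Subject should contain O=system:kube-proxy and CN=system:kube-proxy
openssl x509 -in /gshcmy/certs/kubernetes/kube-proxy.pem -noout -subject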

Set the cluster entry
[root@master141 pki]# kubectl config set-cluster gshcmy-k8s \
  --certificate-authority=/gshcmy/certs/kubernetes/k8s-ca.pem \
  --embed-certs=true \
  --server=https://10.0.0.140:8443 \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-proxy.kubeconfig

Set a user entry
[root@master141 pki]# kubectl config set-credentials system:kube-proxy \
  --client-certificate=/gshcmy/certs/kubernetes/kube-proxy.pem \
  --client-key=/gshcmy/certs/kubernetes/kube-proxy-key.pem \
  --embed-certs=true \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-proxy.kubeconfig

Set a context
[root@master141 pki]# kubectl config set-context kube-proxy@kubernetes \
  --cluster=gshcmy-k8s \
  --user=system:kube-proxy \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-proxy.kubeconfig

Switch to this context as the default
[root@master141 pki]# kubectl config use-context kube-proxy@kubernetes \
  --kubeconfig=/gshcmy/certs/kubeconfig/kube-proxy.kubeconfig
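A quick sanity check on the generated kubeconfig (certificates are embedded, so the output shows DATA+OMITTED rather than file paths):

kubectl config view --kubeconfig=/gshcmy/certs/kubeconfig/kube-proxy.kubeconfig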

Distribute the kube-proxy kubeconfig file to the other nodes
[root@master141 pki]# for NODE in master142 master143 worker144 worker145; do
     echo $NODE
     scp /gshcmy/certs/kubeconfig/kube-proxy.kubeconfig $NODE:/gshcmy/certs/kubeconfig/
done

Create the kube-proxy.yml configuration file on all nodes
cat > /etc/kubernetes/kube-proxy.yml << EOF
apiVersion: kubeproxy.config.k8s.io/v1alpha1
kind: KubeProxyConfiguration
bindAddress: 0.0.0.0
metricsBindAddress: 127.0.0.1:10249
clientConnection:
  acceptContentTypes: ""
  burst: 10
  contentType: application/vnd.kubernetes.protobuf
  kubeconfig: /gshcmy/certs/kubeconfig/kube-proxy.kubeconfig
  qps: 5
clusterCIDR: 10.100.0.0/16
configSyncPeriod: 15m0s
conntrack:
  max: null
  maxPerCore: 32768
  min: 131072
  tcpCloseWaitTimeout: 1h0m0s
  tcpEstablishedTimeout: 24h0m0s
enableProfiling: false
healthzBindAddress: 0.0.0.0:10256
hostnameOverride: ""
iptables:
  masqueradeAll: false
  masqueradeBit: 14
  minSyncPeriod: 0s
ipvs:
  masqueradeAll: true
  minSyncPeriod: 5s
  scheduler: "rr"
  syncPeriod: 30s
mode: "ipvs"
nodePortAddresses: null
oomScoreAdj: -999
portRange: ""
udpIdleTimeout: 250ms
EOF

Manage kube-proxy with systemd on all nodes
cat > /usr/lib/systemd/system/kube-proxy.service << EOF
[Unit]
Description=gshcmy's Kubernetes Proxy
After=network.target

[Service]
ExecStart=/usr/local/bin/kube-proxy \
  --config=/etc/kubernetes/kube-proxy.yml \
  --v=2 
Restart=on-failure
LimitNOFILE=65536

[Install]
WantedBy=multi-user.target
EOF

Start kube-proxy on all nodes
systemctl daemon-reload && systemctl enable --now kube-proxy
systemctl status kube-proxy
ss -ntl |grep 10249
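To confirm kube-proxy really came up in ipvs mode (ipvsadm is optional and may need to be installed first):

# The metrics endpoint should report the active proxy mode
curl -s 127.0.0.1:10249/proxyMode
# If ipvsadm is available, the virtual server table should be populated
ipvsadm -Ln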

Deploying the Calico network plugin

Reference:
	https://docs.tigera.io/calico/latest/getting-started/kubernetes/quickstart
1. Download the manifests
[root@master142 ~]# wget https://raw.githubusercontent.com/projectcalico/calico/v3.28.0/manifests/tigera-operator.yaml

[root@master142 ~]# wget https://raw.githubusercontent.com/projectcalico/calico/v3.28.0/manifests/custom-resources.yaml

Modify the Pod CIDR according to your own K8S network plan
[root@master142 ~]# grep cidr custom-resources.yaml 
      cidr: 192.168.0.0/16
[root@master142 ~]# 
[root@master142 ~]# sed -i '/cidr/s#192.168#10.100#' custom-resources.yaml 
[root@master142 ~]# 
[root@master142 ~]# grep cidr custom-resources.yaml 
      cidr: 10.100.0.0/16

Deploy Calico
[root@master142 ~]# kubectl create -f tigera-operator.yaml 
[root@master142 ~]# 
[root@master142 ~]# kubectl create -f custom-resources.yaml 

Check whether Calico deployed successfully
[root@master141 pki]# kubectl get pods -A -o wide
Tip:
	Image pulls may fail, so the images may need to be pulled manually; a sketch follows.
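A minimal sketch of a manual pull on the affected node, assuming containerd as the runtime (adjust the image name and tag to whatever the stuck Pod actually references):

# Pull into containerd's k8s.io namespace so kubelet can use the image
ctr -n k8s.io images pull docker.io/calico/node:v3.28.0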

Uninstall Calico
[root@master142 ~]# kubectl delete -f custom-resources.yaml  -f  tigera-operator.yaml

Deploying Flannel

Download the manifest
[root@master141 ~]# wget https://github.com/flannel-io/flannel/releases/latest/download/kube-flannel.yml

Modify the manifest
[root@master141 ~]# grep 16 kube-flannel.yml 
      "Network": "10.244.0.0/16",

[root@master141 ~]# sed -i '/Network/s#244#100#' kube-flannel.yml 

[root@master141 ~]# grep 16 kube-flannel.yml 
      "Network": "10.100.0.0/16",

[root@master141 ~]# grep image kube-flannel.yml 
        image: docker.io/flannel/flannel:v0.25.4
        image: docker.io/flannel/flannel-cni-plugin:v1.4.1-flannel1
        image: docker.io/flannel/flannel:v0.25.4

[root@master141 ~]# sed -i 's#docker.io/flannel/flannel:v0.25.4#docker.io/flannel/flannel:v0.25.3#' kube-flannel.yml 

[root@master141 ~]# grep image kube-flannel.yml 
        image: docker.io/flannel/flannel:v0.25.3
        image: docker.io/flannel/flannel-cni-plugin:v1.4.1-flannel1
        image: docker.io/flannel/flannel:v0.25.3

Deploy Flannel
kubectl apply -f kube-flannel.yml 
Check the Flannel components
kubectl get pods -A -o wide

Check that the cluster is healthy
kubectl get nodes
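With the CNI in place the nodes should flip to Ready; a quick smoke test (the busybox image here is an assumption) confirms Pods get addresses from the 10.100.0.0/16 range:

# Launch a throwaway Pod and check its IP
kubectl run net-test --image=busybox:1.36 --restart=Never -- sleep 3600
kubectl get pod net-test -o wide
# Clean up
kubectl delete pod net-test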
