Skip to content

Latest commit

 

History

History
384 lines (296 loc) · 9.38 KB

README.md

File metadata and controls

384 lines (296 loc) · 9.38 KB

quick-install-with-kubeadm

centos7.3下利用kubeadm快速安装kubernets

k8s环境
主机名 内网ip 外网ip
k8s-master 172.16.0.69 ...
k8s-node-1 172.16.0.70 -
k8s-node-2 172.16.0.71 -
  1. 更新语言
/etc/environment
LC_ALL=en_US.utf8
LC_CTYPE=en_US.utf8
LANG=en_US.utf8
  1. 需改hosts节点
vi /etc/hosts
172.16.0.69 k8s-master
172.16.0.70 k8s-node-1
172.16.0.71 k8s-node-2
  1. 关闭防火墙
systemctl stop firewalld
systemctl disable firewalld
  1. 禁用Selinux
setenforce 0
sed -i --follow-symlinks 's/SELINUX=enforcing/SELINUX=disabled/g' /etc/sysconfig/selinux
  1. 设置内核参数
cat <<EOF > /etc/sysctl.d/k8s.conf
net.bridge.bridge-nf-call-ip6tables = 1
net.bridge.bridge-nf-call-iptables = 1
net.ipv4.ip_forward = 1
EOF

sysctl --system && modprobe br_netfilter
  1. 开启ipvs(加载IPVS模块)
cat > /etc/sysconfig/modules/ipvs.modules <<EOF
#!/bin/bash
modprobe -- ip_vs
modprobe -- ip_vs_rr
modprobe -- ip_vs_wrr
modprobe -- ip_vs_sh
modprobe -- nf_conntrack_ipv4
EOF


chmod 755 /etc/sysconfig/modules/ipvs.modules && bash /etc/sysconfig/modules/ipvs.modules && lsmod | grep -e ip_vs -e nf_conntrack_ipv4
  1. 安装docker
#设置国内yum源
wget https://mirrors.aliyun.com/docker-ce/linux/centos/docker-ce.repo -O /etc/yum.repos.d/docker-ce.repo

#安装docker 
yum install -y yum-utils device-mapper-persistent-data lvm2

yum -y install docker-ce-18.09.6-3.el7

#启动docker服务
systemctl enable docker && systemctl start docker
docker --version

#修改各个节点上docker的将cgroup driver改为systemd
mkdir /etc/docker

# Setup daemon.
cat > /etc/docker/daemon.json <<EOF
{
  "exec-opts": ["native.cgroupdriver=systemd"],
  "log-driver": "json-file",
  "log-opts": {
    "max-size": "100m"
  },
  "storage-driver": "overlay2",
  "storage-opts": [
    "overlay2.override_kernel_check=true"
  ]
}
EOF

mkdir -p /etc/systemd/system/docker.service.d

# Restart Docker
systemctl daemon-reload
systemctl restart docker

8.安装etcd

#cfssl安装
wget https://pkg.cfssl.org/R1.2/cfssl_linux-amd64
wget https://pkg.cfssl.org/R1.2/cfssljson_linux-amd64
wget https://pkg.cfssl.org/R1.2/cfssl-certinfo_linux-amd64
chmod +x cfssl_linux-amd64 cfssljson_linux-amd64 cfssl-certinfo_linux-amd64
mv cfssl_linux-amd64 /usr/local/bin/cfssl
mv cfssljson_linux-amd64 /usr/local/bin/cfssljson
mv cfssl-certinfo_linux-amd64 /usr/bin/cfssl-certinfo

#生成etcd ca证书和私钥 初始化ca
cfssl gencert -initca ca-csr.json | cfssljson -bare ca 

#生成server证书
cfssl gencert -ca=ca.pem -ca-key=ca-key.pem -config=ca-config.json -profile=etcd server-csr.json | cfssljson -bare server

#配置etcd启动文件
cp /k8s/etcd/cfg/backup/etcd.service /usr/lib/systemd/system/

#配置etcd文件
cp /k8s/etcd/cfg/backup/etcd.conf.0N /k8s/etcd/cfg/etcd.conf

#启动etcd
systemctl daemon-reload
systemctl enable etcd
systemctl start etcd

#查看服务装填
systemctl status etcd

#切换etcd版本
export ETCDCTL_API=2,[3]

#v2操作命令

#查看集群成员
/k8s/etcd/bin/etcdctl \
--ca-file=/k8s/etcd/ssl/ca.pem \
--cert-file=/k8s/etcd/ssl/server.pem \
--key-file=/k8s/etcd/ssl/server-key.pem \
--endpoints="https://172.16.0.69:2379,https://172.16.0.70:2379,https://172.16.0.71" \
member list

#查看集群健康
/k8s/etcd/bin/etcdctl \
--ca-file=/k8s/etcd/ssl/ca.pem \
--cert-file=/k8s/etcd/ssl/server.pem \
--key-file=/k8s/etcd/ssl/server-key.pem \
--endpoints="https://172.16.0.69:2379,https://172.16.0.70:2379,https://172.16.0.71" \
cluster-health

#v3操作命令
/k8s/etcd/bin/etcdctl \
--cacert=/k8s/etcd/ssl/ca.pem \
--cert=/k8s/etcd/ssl/server.pem \
--key=/k8s/etcd/ssl/server-key.pem \
--endpoints="https://172.16.0.69:2379,https://172.16.0.70:2379,https://172.16.0.71:2379" \
member list

一般故障处理步骤

  • etcdctl member remove ID
  • etcdctl member add NAME url:2380
  • 修改故障etcd配置:
CD_INITIAL_CLUSTER_STATE=existing #修改,从new改为existing
  • 运行
systemctl daemon-reload
  • 启动故障etcd

#其他工具:etcd数据迁移工具:见 /k8s/kubernets/tools/

  1. 安装k8s
#新增yum源
cat <<EOF > /etc/yum.repos.d/kubernetes.repo
[kubernetes]
name=Kubernetes
baseurl=https://mirrors.aliyun.com/kubernetes/yum/repos/kubernetes-el7-x86_64/
enabled=1
gpgcheck=1
repo_gpgcheck=1
gpgkey=https://mirrors.aliyun.com/kubernetes/yum/doc/yum-key.gpg 
    https://mirrors.aliyun.com/kubernetes/yum/doc/rpm-package-key.gpg
EOF

yum makecache fast
yum list |grep kube

yum install -y kubelet-1.14.3 kubeadm-1.14.3 kubectl-1.14.3 ipvsadm

#产生初始化配置文件 :100
kubeadm config print init-default > kubeadm.conf 
kubeadm init --config kubeadm.conf

#更新网络插件
kubectl apply /k8s/kubernets/app/Canal/rbac.yaml
kubectl apply -f /k8s/kubernets/app/Canal/canal.yaml

# 开机自动启动
systemctl status kubelet
systemctl start kubelet

:100 执行完毕,会展示如下类似的命令
kubeadm join api-server:6443 --token abcdef.0123456789abcdef \
    --discovery-token-ca-cert-hash sha256:token-value
在node机上再执行上述命令,就将node机器加到了网络里了

  1. 常用命令
kubectl get cs
kubectl get nodes --all-namespaces
kubectl get services --all-namespaces
kubeadm reset #卸载集群时,master,node都要执行
kubectl drain node_name --delete-local-data --force --ignore-daemonsets # 驱逐node,原来的pod迁移到其他node
kubectl uncordon node_name # 恢复调度
kubectl cordon node_name #禁止调度,原来的pod不迁移

  1. docker私有库继承到k8s
kubectl create secret docker-registry lrj-alyun --docker-server=registry.cn-beijing.aliyuncs.com --docker-username=***** --docker-password=****** --docker-email=sunny_lrj@yeah.net 
  1. etcd管理面板
#https://github.com/evildecay/etcdkeeper
./etcdkeeper -p 8111  -usetls -cacert=/k8s/etcd/ssl/ca.pem  -cert=/k8s/etcd/ssl/server.pem -key=/k8s/etcd/ssl/server-key.pem -sep app -auth

#安装htpasswd命令
yum -y install httpd-tools
htpasswd -c ./auth myusername
kubectl create secret generic mysecret --from-file auth --namespace=monitoring 

#ingress采用basic-auth验证:参看etcd-ui.yaml,生成k8s的secret
htpasswd -bc auth username password
kubectl create secret generic my-secret --from-file=/path/auth
  1. NFS挂载
#安装
yum install -y nfs-utils rpcbind

vim /etc/exports
追加内容:/k8s/kubernets/data *(rw,sync,no_root_squash)


exportfs -r

systemctl enable rpcbind
systemctl start rpcbind

systemctl enable nfs
systemctl start nfs

#查看共享点
showmount -e 172.16.0.69

#挂载磁盘
mount -t nfs -o nolock k8s-master:/k8s/kubernets/data /k8s_data
  1. confd产生配置文件
 confd -onetime -backend etcdv3 -node https://172.16.0.69:2379 \
 -client-ca-keys /k8s/etcd/ssl/ca.pem \
 -client-cert /k8s/etcd/ssl/server.pem \
 -client-key /k8s/etcd/ssl/server-key.pem 
  1. traefik支持https 参考地址
kubectl create secret generic A-cert \
--from-file=/k8s/kubernets/data/http-ssl/A/A.com.crt \
--from-file=/k8s/kubernets/data/http-ssl/A.com.key \
-n kube-system

kubectl create configmap traefik-conf --from-file=traefik.toml -n kube-system

#给节点打标签,只在bind_node=true上运行
kubectl label nodes k8s-master bind_domain=1

# 查看具有bind_domain的机器
kubectl get node -l "bind_domain=1"
      
  1. k8s系统升级
#master上执行:
yum install -y kubeadm-1.15.1  

#查看升级计划
kubeadm upgrade plan

#升级
kubeadm upgrade apply v1.15.1

yum install kubectl-1.15.1 kebulet-1.15.1 -y

systemctl daemon-reload
systemctl restart kubelet


#work上运行
yum install -y kubeadm-1.15.1
kubectl drain k8s-node-1--ignore-daemonsets //master上运行,该节点上的pod会迁移到其他节点

kubeadm upgrade node config --kubelet-version v1.15.1
yum install kubectl-1.15.1 kebulet-1.15.1 -y

systemctl daemon-reload
systemctl restart kubelet

kubectl uncordon k8s-node-1 //master执行,恢复调度到该节点

#其他节点同样操作

参考链接

  1. 证书更新
#查看证书到期时间
kubeadm alpha certs check-expiration

#更新证书
kubeadm alpha certs renew  all

# 更新配置文件

kubeadm init phase kubeconfig all --config /etc/kubernetes/kubeadm-config.yaml
cp /etc/kubernetes/admin.conf ~/.kube/config 

坑: 因为是外挂的etcd集群,在命令执行里 ,会提示找不到etcd的证书,比如:

failed to load existing certificate etcd/healthcheck-client: open /etc/kubernetes/pki/etcd/healthcheck-client.crt: no such file or directory

failure loading etcd/ca certificate authority: failed to load key: couldn't load the private key file

failed to load existing certificate etcd/peer: open /etc/kubernetes/pki/etcd/peer.crt: no such file or directory

/etc/kubernetes/pki/etcd/ca.key: open /etc/kubernetes/pki/etcd/ca.key: no such file or directory

此时只需要把之前的etcd证书,ca证书按报错提示的名字复制到相关目录下。

  1. pod回退
#查看版本记录,并退回到指定版本
kubectl rollout history deployment deployment_name
kubectl rollout undo deployment deployment_name --to-revision=1

退回上一个版本
kubectl rollout undo deployment/nginx-deployment
  1. prometheus监控
    拷贝k8s证书到prometheus目录内
cp /etc/kubernets/pki/* ./XXX

#执行prometheus目录里的yaml