This commit is contained in:
parent
6535633321
commit
484511359b
|
|
@ -35,15 +35,15 @@
|
|||
#### (1)系统初始化
|
||||
|
||||
```bash
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
|
||||
```
|
||||
|
||||
#### (2)MLNX_OFED 网络套件安装/卸载
|
||||
|
||||
```bash
|
||||
#支持版本[23.10-1.1.9.0]
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
|
||||
```
|
||||
|
||||
|
||||
|
|
@ -51,8 +51,8 @@
|
|||
|
||||
```bash
|
||||
#支持版本[565.57.01] [570.124.06]
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
|
||||
|
||||
|
||||
```
|
||||
|
|
@ -61,8 +61,8 @@
|
|||
|
||||
```bash
|
||||
#支持版本[565_565.57.01-1] [570_570.124.06-1]
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
|
||||
```
|
||||
|
||||
|
||||
|
|
@ -70,20 +70,20 @@
|
|||
|
||||
```bash
|
||||
#支持版本[12.6.3_560.35.05] [12.8.1_570.124.06]
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
|
||||
```
|
||||
|
||||
#### (6)dcgm/node exporter 部署/卸载
|
||||
|
||||
```bash
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-dcgm.sh | bash -s -- --install
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/dcgm-exporter.sh | bash -s -- --install
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/node-exporter.sh | bash -s -- --install
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-dcgm.sh | bash -s -- --install
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/dcgm-exporter.sh | bash -s -- --install
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/node-exporter.sh | bash -s -- --install
|
||||
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-dcgm.sh | bash -s -- --uninstall
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/dcgm-exporter.sh | bash -s -- --uninstall
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/node-exporter.sh | bash -s -- --uninstall
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-dcgm.sh | bash -s -- --uninstall
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/dcgm-exporter.sh | bash -s -- --uninstall
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/node-exporter.sh | bash -s -- --uninstall
|
||||
```
|
||||
|
||||
#### (7)批量组件安装/卸载
|
||||
|
|
@ -95,17 +95,17 @@
|
|||

|
||||
```bash
|
||||
安装:---------------------------------------------------------------------------------------------------------------------------------------------
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
|
||||
|
||||
卸载:---------------------------------------------------------------------------------------------------------------------------------------------
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh |bash -s -- --uninstall --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh |bash -s -- --uninstall --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
|
||||
```
|
||||
|
||||

|
||||
|
|
@ -115,35 +115,35 @@
|
|||

|
||||
```bash
|
||||
安装:---------------------------------------------------------------------------------------------------------------------------------------------
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '570.124.06'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.8.1_570.124.06'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '570_570.124.06-1'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '570.124.06'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.8.1_570.124.06'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '570_570.124.06-1'
|
||||
|
||||
|
||||
卸载:--------------------------------------------------------------------------------------------------------------------------------------------
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '570.124.06'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.8.1_570.124.06'
|
||||
cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '570_570.124.06-1'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '570.124.06'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.8.1_570.124.06'
|
||||
cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '570_570.124.06-1'
|
||||
|
||||
```
|
||||

|
||||
```bash
|
||||
#安装/卸载服务(安装或卸载时间较长,建议放后台执行。):
|
||||
#组合[1]-----------------------------------------------------------------------------------------------------------------------------------
|
||||
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --install --version 1 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --install --version 1 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
tail -f /opt/gpu-manager.log
|
||||
|
||||
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --uninstall --version 1 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --uninstall --version 1 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
tail -f /opt/gpu-manager.log
|
||||
|
||||
#组合[2]-----------------------------------------------------------------------------------------------------------------------------------
|
||||
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --install --version 2 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --install --version 2 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
tail -f /opt/gpu-manager.log
|
||||
|
||||
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://10.101.0.51:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --uninstall --version 2 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --uninstall --version 2 --include=exporter > /opt/gpu-manager.log 2>&1";
|
||||
tail -f /opt/gpu-manager.log
|
||||
|
||||
#说明:
|
||||
|
|
|
|||
Loading…
Reference in New Issue