This commit is contained in:
joy 2025-07-05 18:09:24 +08:00
parent 484511359b
commit e8943adab5
1 changed files with 37 additions and 37 deletions

View File

@ -35,15 +35,15 @@
#### 1系统初始化
```bash
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/system_optimize.sh|bash
```
#### 2MLNX_OFED 网络套件安装/卸载
```bash
#支持版本[23.10-1.1.9.0]
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
```
@ -51,8 +51,8 @@
```bash
#支持版本[565.57.01] [570.124.06]
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
```
@ -61,8 +61,8 @@
```bash
#支持版本[565_565.57.01-1] [570_570.124.06-1]
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
```
@ -70,20 +70,20 @@
```bash
#支持版本[12.6.3_560.35.05] [12.8.1_570.124.06]
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
```
#### 6dcgm/node exporter 部署/卸载
```bash
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-dcgm.sh | bash -s -- --install
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/dcgm-exporter.sh | bash -s -- --install
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/node-exporter.sh | bash -s -- --install
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-dcgm.sh | bash -s -- --install
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/dcgm-exporter.sh | bash -s -- --install
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/node-exporter.sh | bash -s -- --install
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-dcgm.sh | bash -s -- --uninstall
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/dcgm-exporter.sh | bash -s -- --uninstall
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/node-exporter.sh | bash -s -- --uninstall
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-dcgm.sh | bash -s -- --uninstall
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/dcgm-exporter.sh | bash -s -- --uninstall
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/node-exporter.sh | bash -s -- --uninstall
```
#### 7批量组件安装/卸载
@ -95,17 +95,17 @@
![Static Badge](https://img.shields.io/badge/fabricmanager-565_565.57.01.1-brightgreen?style=plastic)
```bash
安装:---------------------------------------------------------------------------------------------------------------------------------------------
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/system_optimize.sh|bash
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-driver.sh | bash -s -- --install --version '565.57.01'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/cuda.sh | bash -s -- --install --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '565_565.57.01-1'
卸载:---------------------------------------------------------------------------------------------------------------------------------------------
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh |bash -s -- --uninstall --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/ib-drive.sh |bash -s -- --uninstall --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '565.57.01'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/cuda.sh | bash -s -- --uninstall --version '12.6.3_560.35.05'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '565_565.57.01-1'
```
![Static Badge](https://img.shields.io/badge/组件[2]-orange?style=flat-square)
@ -115,35 +115,35 @@
![Static Badge](https://img.shields.io/badge/fabricmanager-570.124.06.1-brightgreen?style=plastic)
```bash
安装:---------------------------------------------------------------------------------------------------------------------------------------------
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/system_optimize.sh|bash
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --install --version '570.124.06'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --install --version '12.8.1_570.124.06'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '570_570.124.06-1'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/system_optimize.sh|bash
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/ib-drive.sh|bash -s -- --install --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-driver.sh | bash -s -- --install --version '570.124.06'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/cuda.sh | bash -s -- --install --version '12.8.1_570.124.06'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-fabricmanager.sh|bash -s -- --install --version '570_570.124.06-1'
卸载:--------------------------------------------------------------------------------------------------------------------------------------------
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '570.124.06'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/cuda.sh | bash -s -- --uninstall --version '12.8.1_570.124.06'
cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '570_570.124.06-1'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/ib-drive.sh|bash -s -- --uninstall --version '23.10-1.1.9.0'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-driver.sh | bash -s -- --uninstall --version '570.124.06'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/cuda.sh | bash -s -- --uninstall --version '12.8.1_570.124.06'
cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/nvidia-fabricmanager.sh|bash -s -- --uninstall --version '570_570.124.06-1'
```
![Static Badge](https://img.shields.io/badge/推荐一键安装脚本-orange?style=flat-square)
```bash
#安装/卸载服务(安装或卸载时间较长,建议放后台执行。)
#组合[1]-----------------------------------------------------------------------------------------------------------------------------------
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --install --version 1 --include=exporter 2>&1 > /opt/gpu-manager.log";
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/gpu-manager.sh|bash -s -- --install --version 1 --include=exporter > /opt/gpu-manager.log 2>&1";
tail -f /opt/gpu-manager.log
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --uninstall --version 1 --include=exporter 2>&1 > /opt/gpu-manager.log";
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/gpu-manager.sh|bash -s -- --uninstall --version 1 --include=exporter > /opt/gpu-manager.log 2>&1";
tail -f /opt/gpu-manager.log
#组合[2]-----------------------------------------------------------------------------------------------------------------------------------
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --install --version 2 --include=exporter 2>&1 > /opt/gpu-manager.log";
screen -dmS install_script bash -c "cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/gpu-manager.sh|bash -s -- --install --version 2 --include=exporter > /opt/gpu-manager.log 2>&1";
tail -f /opt/gpu-manager.log
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://116.205.97.109:3000:3000/yindun/ansible-devops/raw/branch/main/scripts/gpu-manager.sh|bash -s -- --uninstall --version 2 --include=exporter 2>&1 > /opt/gpu-manager.log";
screen -dmS uninstall_script bash -c "cd /opt/ && wget -qO- http://yindun.muyun688.top/scripts/gpu-manager.sh|bash -s -- --uninstall --version 2 --include=exporter > /opt/gpu-manager.log 2>&1";
tail -f /opt/gpu-manager.log
#说明