From 94740767e2fe47216f48e6bbbdb2bf7f0bd80c54 Mon Sep 17 00:00:00 2001
From: baol
Date: Wed, 18 Dec 2024 09:21:45 +0800
Subject: [PATCH 1/3] fix n2 bug

---
 n2.slurm.sh | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/n2.slurm.sh b/n2.slurm.sh
index b5ad931..d613a72 100755
--- a/n2.slurm.sh
+++ b/n2.slurm.sh
@@ -1,8 +1,11 @@
 #!/bin/bash
 
 # 修改 /usr/lib/systemd/system/slurmd.service 文件
-sudo sed -i 's|ExecStart=/usr/sbin/slurmd --systemd $SLURMD_OPTIONS|ExecStart=/usr/sbin/slurmd --conf=/opt/slurm/slurm.conf --systemd $SLURMD_OPTIONS|' /usr/lib/systemd/system/slurmd.service
+sudo cp /opt/slurm/slurm.conf /etc/slurm/
+sudo chown -R slurm: /var/log/slurm
+
+sudo chown -R slurm: /var/spool/slurmd
 
 # 重新加载 systemd 配置
 sudo systemctl daemon-reload
 

From ba7149e1148c935eef10d8cb261886cfb6d527b3 Mon Sep 17 00:00:00 2001
From: baol
Date: Wed, 18 Dec 2024 09:33:21 +0800
Subject: [PATCH 2/3] change slurmd.service

---
 files/slurmd.service | 16 +++++++++++-----
 1 file changed, 11 insertions(+), 5 deletions(-)

diff --git a/files/slurmd.service b/files/slurmd.service
index 37a2c90..417f6b8 100644
--- a/files/slurmd.service
+++ b/files/slurmd.service
@@ -1,13 +1,18 @@
 [Unit]
 Description=Slurm node daemon
-After=munge.service network-online.target remote-fs.target
+After=munge.service network-online.target remote-fs.target sssd.service
 Wants=network-online.target
-#ConditionPathExists=/opt/slurm/etc/slurm.conf
+#ConditionPathExists=/etc/slurm/slurm.conf
+Documentation=man:slurmd(8)
 
 [Service]
-Type=simple
-EnvironmentFile=-/etc/sysconfig/slurmd
-ExecStart=/opt/slurm/sbin/slurmd -D -s $SLURMD_OPTIONS
+User=slurm
+Group=slurm
+Type=notify
+EnvironmentFile=-/etc/default/slurmd
+RuntimeDirectory=slurm
+RuntimeDirectoryMode=0755
+ExecStart=/usr/sbin/slurmd --systemd $SLURMD_OPTIONS
 ExecReload=/bin/kill -HUP $MAINPID
 KillMode=process
 LimitNOFILE=131072
@@ -23,3 +28,4 @@ TasksMax=infinity
 
 [Install]
 WantedBy=multi-user.target
+

From bdf9baddd1fbd7677079a18ec821ddebd0e49afe Mon Sep 17 00:00:00 2001
From: baol
Date: Wed, 18 Dec 2024 09:36:41 +0800
Subject: [PATCH 3/3] fix bug

---
 files/slurm.conf | 2 +-
 n2.slurm.sh      | 6 +++++-
 2 files changed, 6 insertions(+), 2 deletions(-)

diff --git a/files/slurm.conf b/files/slurm.conf
index dd6acda..bd93b73 100755
--- a/files/slurm.conf
+++ b/files/slurm.conf
@@ -50,7 +50,7 @@ SlurmctldPort=6817
 SlurmdPidFile=/var/run/slurmd.pid
 SlurmdPort=6818
 SlurmdSpoolDir=/var/spool/slurmd
-#SlurmUser=slurm
+SlurmdUser=slurm
 #SlurmdUser=root
 #SrunEpilog=
 #SrunProlog=
diff --git a/n2.slurm.sh b/n2.slurm.sh
index d613a72..83f85cd 100755
--- a/n2.slurm.sh
+++ b/n2.slurm.sh
@@ -1,13 +1,17 @@
 #!/bin/bash
 
 # 修改 /usr/lib/systemd/system/slurmd.service 文件
-sudo cp /opt/slurm/slurm.conf /etc/slurm/
+sudo cp /home/laoban/config/files/slurm.conf /etc/slurm/
 sudo chown -R slurm: /var/log/slurm
 
 sudo chown -R slurm: /var/spool/slurmd
+
+sudo cp /home/laoban/config/files/slurmd.service /usr/lib/systemd/system/
+
 
 # 重新加载 systemd 配置
 sudo systemctl daemon-reload
+
 
 # 重启 slurmd 服务
 sudo systemctl restart slurmd