Browse Source

Basic slurm

main
Dustin Frisch 1 year ago
parent
commit
4240539bca
No known key found for this signature in database GPG Key ID: B4C3BF012D9B26BE
  1. 1
      machines/manager/default.nix
  2. 5
      machines/manager/slurm.nix
  3. 1
      machines/node/default.nix
  4. 7
      machines/node/slurm.nix
  5. 1
      shared/default.nix
  6. 6
      shared/secrets.yaml
  7. 35
      shared/slurm.nix

1
machines/manager/default.nix

@ -18,6 +18,7 @@ with lib;
./cache.nix ./cache.nix
./rdma.nix ./rdma.nix
./mpi.nix ./mpi.nix
./slurm.nix
]; ];
deployment = { deployment = {

5
machines/manager/slurm.nix

@ -0,0 +1,5 @@
# Manager-specific slurm settings: turns on the slurm server side on this
# machine. Cluster-wide slurm options are not set in this file.
{
  services.slurm.server.enable = true;
}

1
machines/node/default.nix

@ -9,6 +9,7 @@ with lib;
./disk.nix ./disk.nix
./network.nix ./network.nix
./users.nix ./users.nix
./slurm.nix
]; ];
deployment = { deployment = {

7
machines/node/slurm.nix

@ -0,0 +1,7 @@
# Node-specific slurm settings: turns on the slurm client side on this
# machine. Cluster-wide slurm options are not set in this file.
{ config, ... }:

{
  services.slurm.client.enable = true;
}

1
shared/default.nix

@ -7,6 +7,7 @@
./ssh.nix ./ssh.nix
./rdma.nix ./rdma.nix
./ssl.nix ./ssl.nix
./slurm.nix
"${modulesPath}/profiles/headless.nix" "${modulesPath}/profiles/headless.nix"
"${modulesPath}/profiles/all-hardware.nix" "${modulesPath}/profiles/all-hardware.nix"

6
shared/secrets.yaml

@ -3,6 +3,8 @@ ldap:
password: ENC[AES256_GCM,data:IFPwehOGSYore+HEv7MyymCKaOKn5XEH,iv:JTrZucSL/MohMgUdWqalpgjCCh7ueXd3cgNB0FuJo/U=,tag:o/1nvTrfojYsXYeuvxKfNg==,type:str] password: ENC[AES256_GCM,data:IFPwehOGSYore+HEv7MyymCKaOKn5XEH,iv:JTrZucSL/MohMgUdWqalpgjCCh7ueXd3cgNB0FuJo/U=,tag:o/1nvTrfojYsXYeuvxKfNg==,type:str]
beegfs: beegfs:
connection: ENC[AES256_GCM,data:YTHMg76+5Azb+ex5ArUHt4xP+YYWr9Ph,iv:TEf8i+yezPsaW12Lg5jRnhds9uW9WhV6duZPdxeW9co=,tag:bPGsl7ofwE1Jh+FTyHJqzQ==,type:str] connection: ENC[AES256_GCM,data:YTHMg76+5Azb+ex5ArUHt4xP+YYWr9Ph,iv:TEf8i+yezPsaW12Lg5jRnhds9uW9WhV6duZPdxeW9co=,tag:bPGsl7ofwE1Jh+FTyHJqzQ==,type:str]
munge:
password: ENC[AES256_GCM,data:3cVMO9Q5G/UyM8r2x/XG0sHJalt4cvTZpw1o9tdUVeJ5sm6kWdhzCYu2mTnHn10A8gPtnP16Cibj+hwgT3Ib/g==,iv:dOeQyOmWwDB6irEyqNmPGHhZdgRhLQsQt48lKAX9jh4=,tag:OBZzzfCz04JOa7GmCbGCTw==,type:str]
sops: sops:
kms: [] kms: []
gcp_kms: [] gcp_kms: []
@ -81,8 +83,8 @@ sops:
c01zMTA2dnZlTGxGd0oxYklXMHdWTUkKYjSQ7Y16AXfiLaOwsyV8LFjUtbUJ744A c01zMTA2dnZlTGxGd0oxYklXMHdWTUkKYjSQ7Y16AXfiLaOwsyV8LFjUtbUJ744A
uxlImBcQnbiPkJY4DRxmtrBrTSzfX1pdepNH8DR0ZpjpI/6bibHEag== uxlImBcQnbiPkJY4DRxmtrBrTSzfX1pdepNH8DR0ZpjpI/6bibHEag==
-----END AGE ENCRYPTED FILE----- -----END AGE ENCRYPTED FILE-----
lastmodified: "2023-06-27T09:58:35Z"
mac: ENC[AES256_GCM,data:pPgwJnUdwQegqaCXdh7lweQq2Kos6szvo/mfBul+2TruUSSRXlGwKmNVLM2BuodMNZpTan2vCyvVlXvN4zBfW6nVWPzlBrCTbgtyBNodB+k3OJsfgUElQ32T9KccsMVuUsfKDzjhlFnV3NA9A7DVnrYz+jf1NcNSsz4yOjHudzA=,iv:ciFHyXhIcNFlB9fhzcAX8LICIsGPWDe29fxtjmJ0G+s=,tag:oldhGvm8vfPnuhpIXIpVWw==,type:str]
lastmodified: "2023-07-07T10:50:20Z"
mac: ENC[AES256_GCM,data:84PcC2J2peF6ZyEWH4o8gFw1yopC2o7DN5fg2I1+eUQVRmm8WqJbMkIF2taQeJndliEvsPBg6XXvbtJqdTs2L8o4EkkEwK4whbIosFyuVBuI3NRjjc1qswyYHudZa8CAtXPrVXqtD0q5QOtHwlUdGAyoBCpT8x2ZFaeye+JDuec=,iv:GhvwtEQMZlojwi0KoKUAQeuL53a0EFw1h+ysI9jeMuU=,tag:YJ8iYskhY8r3nDJIYxMusA==,type:str]
pgp: pgp:
- created_at: "2023-07-05T13:59:05Z" - created_at: "2023-07-05T13:59:05Z"
enc: | enc: |

35
shared/slurm.nix

@ -0,0 +1,35 @@
# Slurm and munge settings common to every machine importing this module.
#
# The slurm node list is derived from the deployment's `nodes` argument: each
# machine whose `deployment.tags` contains "node" contributes one entry.
{ pkgs, lib, config, nodes, ... }:

let
  # Name of the sops secret holding the munge credential.
  mungeSecret = "munge/password";

  # True for machines that carry the "node" deployment tag.
  hasNodeTag = machine: lib.elem "node" machine.config.deployment.tags;

  # Slurm node definition line for one machine; the CPU count is fixed at 64.
  nodeLine = machine: "${machine.config.networking.hostName} CPUs=64";

  # All machines of the deployment that are tagged as "node".
  taggedNodes = lib.filter hasNodeTag (lib.attrValues nodes);
in
{
  services.slurm = {
    clusterName = "mogli";
    controlMachine = "manager";

    nodeName = map nodeLine taggedNodes;

    # A single default partition spanning all nodes.
    partitionName = [
      "all Nodes=ALL AllowGroups=cluster Default=YES MaxTime=INFINITE State=UP"
    ];

    # Point slurm's mail program at coreutils' `false` binary.
    extraConfig = ''
      MailProg=${pkgs.coreutils}/bin/false
    '';
  };

  # Secret is read from the shared secrets file and owned by the "munge" user.
  sops.secrets.${mungeSecret} = {
    owner = "munge";
    sopsFile = ./secrets.yaml;
  };

  services.munge = {
    enable = true;
    # Path at which sops makes the secret available.
    password = config.sops.secrets.${mungeSecret}.path;
  };
}
Loading…
Cancel
Save