Skip to content

Commit

Permalink
apply resource schema
Browse files Browse the repository at this point in the history
  • Loading branch information
andre-merzky committed Aug 2, 2023
1 parent e80ed79 commit 7d6864e
Show file tree
Hide file tree
Showing 14 changed files with 486 additions and 420 deletions.
214 changes: 104 additions & 110 deletions src/radical/pilot/configs/resource_access.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,16 +3,16 @@
"expanse": {
"description" : "(https://www.sdsc.edu/support/user_guides/expanse.html).",
"notes" : "Always set the ``project`` attribute in the PilotDescription.",
"schemas" : ["local", "ssh"],
"local" :
{
"job_manager_endpoint" : "slurm://expanse.sdsc.xsede.org",
"filesystem_endpoint" : "file://expanse.sdsc.xsede.org"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://expanse.sdsc.xsede.org",
"filesystem_endpoint" : "sftp://expanse.sdsc.xsede.org"
"default_schema" : "local",
"schemas" : {
"local" : {
"job_manager_endpoint" : "slurm://expanse.sdsc.xsede.org",
"filesystem_endpoint" : "file://expanse.sdsc.xsede.org"
},
"ssh" : {
"job_manager_endpoint" : "slurm+ssh://expanse.sdsc.xsede.org",
"filesystem_endpoint" : "sftp://expanse.sdsc.xsede.org"
}
},
"default_remote_workdir" : "/expanse/lustre/scratch/$USER/temp_project",
"default_queue" : "compute",
Expand Down Expand Up @@ -41,22 +41,21 @@
"stampede2_ssh": {
"description" : "The ACCESS 'Stampede' cluster at TACC (https://docs.tacc.utexas.edu/hpc/stampede2/).",
"notes" : "Always set the ``project`` attribute in the PilotDescription or the pilot will fail.",
"schemas" : ["local", "gsissh", "ssh"],
"mandatory_args" : ["project"],
"gsissh" :
{
"job_manager_endpoint" : "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" :
{
"job_manager_endpoint" : "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
"default_schema" : "local",
"schemas" : {
"gsissh" : {
"job_manager_endpoint": "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" : {
"job_manager_endpoint": "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" : {
"job_manager_endpoint": "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
}
},
"default_queue" : "normal",
"resource_manager" : "SLURM",
Expand Down Expand Up @@ -89,22 +88,21 @@
"stampede2_mpirun": {
"description" : "The ACCESS 'Stampede' cluster at TACC (https://docs.tacc.utexas.edu/hpc/stampede2/).",
"notes" : "Always set the ``project`` attribute in the PilotDescription or the pilot will fail.",
"schemas" : ["local", "gsissh", "ssh"],
"mandatory_args" : ["project"],
"gsissh" :
{
"job_manager_endpoint" : "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" :
{
"job_manager_endpoint" : "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
"default_schema" : "local",
"schemas" : {
"gsissh" : {
"job_manager_endpoint": "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" : {
"job_manager_endpoint": "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" : {
"job_manager_endpoint": "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
}
},
"default_queue" : "normal",
"resource_manager" : "SLURM",
Expand Down Expand Up @@ -133,22 +131,21 @@
"stampede2_ibrun_repex": {
"description" : "The ACCESS 'Stampede' cluster at TACC (https://docs.tacc.utexas.edu/hpc/stampede2/).",
"notes" : "Always set the ``project`` attribute in the PilotDescription or the pilot will fail.",
"schemas" : ["local", "gsissh", "ssh"],
"mandatory_args" : ["project"],
"gsissh" :
{
"job_manager_endpoint" : "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" :
{
"job_manager_endpoint" : "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
"default_schema" : "local",
"schemas" : {
"gsissh" : {
"job_manager_endpoint": "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" : {
"job_manager_endpoint": "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" : {
"job_manager_endpoint": "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
}
},
"cores_per_node" : 68,
"default_queue" : "normal",
Expand Down Expand Up @@ -181,22 +178,21 @@
"stampede2_ibrun": {
"description" : "The ACCESS 'Stampede' cluster at TACC (https://docs.tacc.utexas.edu/hpc/stampede2/).",
"notes" : "Always set the ``project`` attribute in the ComputePilotDescription or the pilot will fail.",
"schemas" : ["local", "gsissh", "ssh"],
"mandatory_args" : ["project"],
"gsissh" :
{
"job_manager_endpoint" : "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" :
{
"job_manager_endpoint" : "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
"default_schema" : "local",
"schemas" : {
"gsissh" : {
"job_manager_endpoint": "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" : {
"job_manager_endpoint": "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" : {
"job_manager_endpoint": "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
}
},
"cores_per_node" : 68,
"default_queue" : "normal",
Expand Down Expand Up @@ -226,22 +222,21 @@
"stampede2_srun": {
"description" : "The ACCESS 'Stampede' cluster at TACC (https://docs.tacc.utexas.edu/hpc/stampede2/).",
"notes" : "Always set the ``project`` attribute in the PilotDescription or the pilot will fail.",
"schemas" : ["local", "gsissh", "ssh"],
"mandatory_args" : ["project"],
"gsissh" :
{
"job_manager_endpoint" : "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" :
{
"job_manager_endpoint" : "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
"default_schema" : "local",
"schemas" : {
"gsissh" : {
"job_manager_endpoint": "slurm+gsissh://stampede2.tacc.utexas.edu:2222/",
"filesystem_endpoint" : "gsisftp://stampede2.tacc.utexas.edu:2222/"
},
"ssh" : {
"job_manager_endpoint": "slurm+ssh://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "sftp://stampede2.tacc.utexas.edu/"
},
"local" : {
"job_manager_endpoint": "slurm://stampede2.tacc.utexas.edu/",
"filesystem_endpoint" : "file://stampede2.tacc.utexas.edu/"
}
},
"default_queue" : "normal",
"resource_manager" : "SLURM",
Expand Down Expand Up @@ -271,12 +266,13 @@
"comet": {
"description" : "The retired Comet HPC resource at SDSC 'HPC for the 99%%' (https://www.sdsc.edu/support/user_guides/comet.html).",
"notes" : "Always set the ``project`` attribute in the PilotDescription or the pilot will fail.",
"schemas" : ["ssh"],
"mandatory_args" : ["project"],
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://comet.sdsc.xsede.org/",
"filesystem_endpoint" : "sftp://comet.sdsc.xsede.org/"
"default_schema" : "ssh",
"schemas" : {
"ssh" : {
"job_manager_endpoint": "slurm+ssh://comet.sdsc.xsede.org/",
"filesystem_endpoint" : "sftp://comet.sdsc.xsede.org/"
}
},
"default_queue" : "compute",
"lfs_path_per_node" : "/scratch/$USER/$SLURM_JOB_ID",
Expand Down Expand Up @@ -306,27 +302,25 @@
"bridges2": {
"description" : "The ACCESS 'Bridges2' cluster at PSC (https://www.psc.edu/resources/bridges-2/user-guide-2-2/).",
"notes" : "Always set the ``project`` attribute in the PilotDescription.",
"schemas" : ["local", "interactive", "gsissh", "ssh"],
# "mandatory_args" : [],
"local" :
{
"job_manager_endpoint" : "slurm://bridges2.psc.xsede.org/",
"filesystem_endpoint" : "file://bridges2.psc.xsede.org/"
},
"interactive" :
{
"job_manager_endpoint" : "fork://localhost/",
"filesystem_endpoint" : "file://localhost/"
},
"gsissh" :
{
"job_manager_endpoint" : "slurm+gsissh://bridges2.psc.xsede.org:2222/",
"filesystem_endpoint" : "gsisftp://bridges2.psc.xsede.org:2222/"
},
"ssh" :
{
"job_manager_endpoint" : "slurm+ssh://bridges2.psc.xsede.org/",
"filesystem_endpoint" : "sftp://bridges2.psc.xsede.org/"
"default_schema" : "local",
"schemas" : {
"local" : {
"job_manager_endpoint": "slurm://bridges2.psc.xsede.org/",
"filesystem_endpoint" : "file://bridges2.psc.xsede.org/"
},
"interactive" : {
"job_manager_endpoint": "fork://localhost/",
"filesystem_endpoint" : "file://localhost/"
},
"gsissh" : {
"job_manager_endpoint": "slurm+gsissh://bridges2.psc.xsede.org:2222/",
"filesystem_endpoint" : "gsisftp://bridges2.psc.xsede.org:2222/"
},
"ssh" : {
"job_manager_endpoint": "slurm+ssh://bridges2.psc.xsede.org/",
"filesystem_endpoint" : "sftp://bridges2.psc.xsede.org/"
}
},
"default_queue" : "RM",
"resource_manager" : "SLURM",
Expand Down
60 changes: 33 additions & 27 deletions src/radical/pilot/configs/resource_anl.json
Original file line number Diff line number Diff line change
Expand Up @@ -3,12 +3,13 @@
"theta": {
"description" : "Cray XC40, 4392 nodes (Intel KNL 7230)",
"notes" : "Local instance of MongoDB and pre-set VE should be used.",
"schemas" : ["local"],
"local" :
{
"job_manager_hop" : "cobalt://localhost/",
"job_manager_endpoint" : "cobalt://localhost/",
"filesystem_endpoint" : "file://localhost/"
"default_schema" : "local",
"schemas" : {
"local" : {
"job_manager_hop" : "cobalt://localhost/",
"job_manager_endpoint": "cobalt://localhost/",
"filesystem_endpoint" : "file://localhost/"
}
},
"default_queue" : "debug-flat-quad",
"resource_manager" : "COBALT",
Expand All @@ -33,12 +34,13 @@
"theta_gpu": {
"description" : "Extension of Theta, 24 NVIDIA DGX A100 nodes",
"notes" : "Local instance of MongoDB and pre-set VE should be used.",
"schemas" : ["local"],
"local" :
{
"job_manager_hop" : "cobalt://localhost/",
"job_manager_endpoint" : "cobalt://localhost/",
"filesystem_endpoint" : "file://localhost/"
"default_schema" : "local",
"schemas" : {
"local" : {
"job_manager_hop" : "cobalt://localhost/",
"job_manager_endpoint": "cobalt://localhost/",
"filesystem_endpoint" : "file://localhost/"
}
},
"default_queue" : "full-node",
"resource_manager" : "COBALT",
Expand Down Expand Up @@ -66,11 +68,12 @@
"polaris": {
"description" : "AMD EPYC Milan 7543P 32 core CPU with four Nvidia A100 GPUs, 560 nodes",
"notes" : "Local instance of MongoDB and pre-set VE should be used.",
"schemas" : ["local"],
"local" :
{
"job_manager_endpoint" : "pbspro://localhost/",
"filesystem_endpoint" : "file://localhost/"
"default_schema" : "local",
"schemas" : {
"local" : {
"job_manager_endpoint": "pbspro://localhost/",
"filesystem_endpoint" : "file://localhost/"
}
},
"default_queue" : "debug-scaling",
"resource_manager" : "PBSPRO",
Expand All @@ -95,11 +98,12 @@
"polaris_interactive": {
"description" : "AMD EPYC Milan 7543P 32 core CPU with four Nvidia A100 GPUs, 560 nodes",
"notes" : "Local instance of MongoDB and pre-set VE should be used.",
"schemas" : ["interactive"],
"interactive" :
{
"job_manager_endpoint" : "fork://localhost/",
"filesystem_endpoint" : "file://localhost/"
"default_schema" : "interactive",
"schemas" : {
"interactive" : {
"job_manager_endpoint": "fork://localhost/",
"filesystem_endpoint" : "file://localhost/"
}
},
"resource_manager" : "PBSPRO",
"agent_config" : "default",
Expand All @@ -122,11 +126,13 @@
"arcticus": {
"description" : "JLSE Aurora testbed; 17x Coyote Pass nodes, 2x XeHP_SDV",
"notes" : "Duo two-factor login. Local instance of virtualenv should be used.",
"schemas" : [ "local" ],
"local" : {
"job_manager_hop" : "cobalt://localhost/",
"job_manager_endpoint" : "cobalt://localhost/",
"filesystem_endpoint" : "file://localhost/"
"default_schema" : "local",
"schemas" : {
"local" : {
"job_manager_hop" : "cobalt://localhost/",
"job_manager_endpoint": "cobalt://localhost/",
"filesystem_endpoint" : "file://localhost/"
}
},
# "forward_tunnel_endpoint" : "jlselogin5",
"default_queue" : "full-node",
Expand Down
Loading

0 comments on commit 7d6864e

Please sign in to comment.