generated from clemsonciti/ood_jupyter
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathform.yml.erb
146 lines (131 loc) · 4.27 KB
/
form.yml.erb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
#<%-
# get _list_partitions
# p_cmd = "/opt/pbs/default/bin/qstat -Q | grep Rou | grep -v -E 'a100|p100|v100|k240|c1|c2|osg' | awk '{print $1}' | sort"
# begin
# output, status = Open3.capture2e(p_cmd)
# if status.success?
# _list_partitions = output.split("\n").map(&:strip).reject(&:blank?).sort
# else
# raise output
# end
# rescue => e
# _list_partitions = []
# p_error = e.message.strip
# end
#
#-%>
#---
# The cluster id set here **MUST** match a cluster configuration file located
# under /etc/ood/config/clusters.d/*.yml
cluster: "palmetto"

# Definition of every form field. For the "select" widgets each option is a
# [label, value] pair, and `value:` names the option value selected by default,
# so it has to equal one of the option values listed below it.
# NOTE(review): the ":key=val" option values look like fragments that the
# submit template appends to the PBS select statement - confirm there.
attributes:
  # Palmetto PBS specific options
  pbs_select:
    label: "Number of resource chunks (select)"
    value: "1"

  pbs_ncpus:
    label: "CPU cores per chunk (ncpus)"
    value: "1"
    help: |
      <small> - Typical Palmetto compute nodes have <b>8, 12, 16, 20, 24, 28, 40, and 56</b> cores.<br>
      - DGX nodes have <b>128</b> cores.<br>
      - Bigmem nodes have <b>24, 32, 40, and 80</b> cores.<br>
      - <b>Users can request any number of cores that is smaller than the number of available cores.</b>
      </small>

  pbs_mem:
    label: "Amount of memory per chunk (mem)"
    value: "1gb"
    help: |
      <small> - Typical Palmetto compute nodes have <b>15gb, 30gb, 46gb, 62gb, 125gb, 372gb, 748gb, and 990gb</b> of memory.<br>
      - DGX nodes have <b>990gb</b> of memory.<br>
      - Bigmem nodes have <b>500gb and 750gb</b> and <b>1tb and 1.5tb</b> of memory.
      </small>

  pbs_ngpus:
    label: "Number of GPUs per chunk (ngpus)"
    widget: "select"
    # Default to the "None" entry; its option value is the empty string.
    value: ""
    options:
      - ["None", ""]
      - ["1", ":ngpus=1"]
      - ["2", ":ngpus=2"]
      - ["4", ":ngpus=4"]

  pbs_gpu_model:
    label: "GPU Model (gpu_model)"
    widget: "select"
    # Default to the "None" entry; its option value is the empty string.
    value: ""
    options:
      - ["None", ""]
      - ["Any", ":gpu_model=any"]
      - ["K20", ":gpu_model=k20"]
      - ["K40", ":gpu_model=k40"]
      - ["P100", ":gpu_model=p100"]
      - ["V100", ":gpu_model=v100"]
      - ["V100 with NVLink", ":gpu_model=v100nv"]
      - ["A100", ":gpu_model=a100"]

  pbs_interconnect:
    label: "Interconnect"
    widget: "select"
    # Default to the "any" entry; its option value is the empty string.
    value: ""
    options:
      - ["any", ""]
      - ["1g - Ethernet older phases 1-6", ":interconnect=1g"]
      - ["10g - Ethernet phase 7-18 and phase 0 (bigmem queue)", ":interconnect=10ge"]
      - ["25g - Ethernet phase 18b-27", ":interconnect=25ge"]
      - ["56g - Ethernet phase 7-17", ":interconnect=56g"]
      - ["fdr - Infiniband phase 7-17", ":interconnect=fdr"]
      - ["hdr - Infiniband phase 18 and above", ":interconnect=hdr"]
      - ["100g - Ethernet phase 18 and above", ":interconnect=100g"]

  pbs_walltime:
    label: "Walltime"
    value: "00:30:00"
    help: |
      <small> - Walltime format is <b>hh:mm:ss</b>.<br>
      - Phase 1 through 6 nodes can be reserved up to 336 hours.<br>
      - Phase 7 through 27 nodes can be reserved up to 72 hours.
      </small>

  pbs_extras:
    label: "Extra PBS resource allocation request"
    value: ""
    help: |
      <small>- Enter the additional resource request just like how you would in a command line environment.<br>
      - Each request should start with a colon <b>:</b> sign. <br>
      - For example: <b>:chip_type=e5-2665</b></small>

  pbs_queue:
    label: "Queue"
    required: true
    help: |
      <small>Queue to submit the job to</small>
    widget: "select"
    value: "work1"
    # One [label, value] option per queue name returned by CustomQueues.queues
    # (defined outside this file). The "-%>" trim keeps the loop tags from
    # leaving blank lines in the rendered YAML.
    options:
      <%- CustomQueues.queues.each do |g| -%>
      - ["<%= g %>", "<%= g %>"]
      <%- end -%>

  images:
    label: "Path to the container image"
    value: ""
    help: |
      <small> Provide a path to the container image. This could be a link to
      a Docker/Apptainer image or path to a directory/sif file<br>
      - Docker example: <b>docker://jupyter/scipy-notebook</b><br>
      - Local example: <b>/zfs/citi/container_images/scipy-notebook_latest.sif</b>
      </small>

  working_dir:
    label: "Absolute path to working directory"
    data-filepicker: true
    data-target-file-type: dirs  # Valid values are: files, dirs, or both
    readonly: false
    help: "Select your project directory; defaults to $HOME"

# Fields shown on the form, in display order. Every entry except
# bc_email_on_started is configured under `attributes` above.
form:
  - images
  - pbs_select
  - pbs_ncpus
  - pbs_mem
  - pbs_ngpus
  - pbs_gpu_model
  - pbs_interconnect
  - pbs_extras
  - pbs_walltime
  - pbs_queue
  - working_dir
  - bc_email_on_started