-
Notifications
You must be signed in to change notification settings - Fork 131
/
Copy pathomnia.yml
216 lines (188 loc) · 4.79 KB
/
omnia.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
# Copyright 2022 Dell Inc. or its subsidiaries. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
---
# Play: run the cluster_validation role on localhost over a local
# connection, without gathering facts first.
- name: Validate the cluster
  hosts: localhost
  connection: local
  # Canonical boolean; matches the true/false spelling used by the other plays.
  gather_facts: false
  roles:
    - cluster_validation
# Play: collect facts from the manager, compute, login_node and nfs_node
# groups. It has no roles or tasks; fact gathering is its only effect, so it
# is requested explicitly rather than left to the configured default policy.
- name: Gather facts from all the nodes
  hosts: manager, compute, login_node, nfs_node
  gather_facts: true
# Play: run the hostname_validation role on the manager and login_node
# groups. Tagged "freeipa".
- name: Validate hostname
  hosts: manager, login_node
  gather_facts: false
  # A failure on any host ends the play for every host.
  any_errors_fatal: true
  roles:
    - hostname_validation
  tags: freeipa
# Play: run the beegfs_validation role on the manager and compute groups.
# Tagged "beegfs".
- name: BeeGFS validation
  hosts: manager, compute
  gather_facts: false
  # A failure on any host ends the play for every host.
  any_errors_fatal: true
  roles:
    - beegfs_validation
  tags: beegfs
# Play: apply the common role to all four node groups. Tagged "common".
- name: Apply common installation and config
  hosts: manager, compute, login_node, nfs_node
  gather_facts: false
  # A failure on any host ends the play for every host.
  any_errors_fatal: true
  roles:
    - common
  tags: common
# Play: run the nfs_sas role on the nfs_node group. Tagged "nfs_server_sas".
- name: Configure NFS node for SAS protocol
  hosts: nfs_node
  gather_facts: false
  vars:
    # NOTE(review): this SSH option turns off host key checking for the
    # connections made by this play - confirm that is acceptable here.
    ansible_ssh_common_args: '-o StrictHostKeyChecking=no'
  roles:
    - nfs_sas
  tags: nfs_server_sas
# Play: run the nfs_iscsi role on the nfs_node group.
# Tagged "nfs_server_iscsi".
- name: Configure NFS node for ISCSI protocol
  hosts: nfs_node
  gather_facts: false
  vars:
    # NOTE(review): this SSH option turns off host key checking for the
    # connections made by this play - confirm that is acceptable here.
    ansible_ssh_common_args: '-o StrictHostKeyChecking=no'
  roles:
    - nfs_iscsi
  tags: nfs_server_iscsi
# Play: run the nfs_client role on the manager, compute and login_node
# groups. Tagged "nfs_client".
- name: Apply NFS client installation and config
  hosts: manager, compute, login_node
  gather_facts: false
  roles:
    - nfs_client
  tags: nfs_client
# Play: run the login_common role on the manager and login_node groups.
# Tagged "freeipa".
- name: Apply login common installation and config
  hosts: manager, login_node
  gather_facts: false
  roles:
    - login_common
  tags: freeipa
# Play: run the login_server role on the manager group. Tagged "freeipa".
- name: Apply login server installation and config
  hosts: manager
  gather_facts: false
  roles:
    - login_server
  tags: freeipa
# Play: run the login_node role on the login_node group. Tagged "freeipa".
- name: Apply login node installation and config
  hosts: login_node
  gather_facts: false
  roles:
    - login_node
  tags: freeipa
# Play: run the k8s_common role on the manager and compute groups.
# Tagged "kubernetes".
- name: Apply common K8s installation and config
  hosts: manager, compute
  gather_facts: false
  roles:
    - k8s_common
  tags: kubernetes
# Play: run the k8s_manager role on the manager group. Unlike most plays in
# this file, facts are gathered at the start of this play.
# Tagged "kubernetes".
- name: Apply K8s manager config
  hosts: manager
  gather_facts: true
  roles:
    - k8s_manager
  tags: kubernetes
# Play: run the k8s_firewalld role on the manager and compute groups.
# Tagged "kubernetes".
- name: Apply K8s firewalld config on manager and compute nodes
  hosts: manager, compute
  gather_facts: false
  roles:
    - k8s_firewalld
  tags: kubernetes
# Play: on the manager group, include the k8s_nfs_server_setup role unless
# the powervault_status variable recorded for host 127.0.0.1 is truthy.
# NOTE(review): indentation was lost in this copy of the file; `tags` is
# placed at play level, as in the other plays - confirm against the original.
- name: Apply NFS server setup on manager node
  hosts: manager
  gather_facts: false
  tasks:
    - name: Apply NFS server setup on manager node
      include_role:
        name: k8s_nfs_server_setup
      when: not hostvars['127.0.0.1']['powervault_status']
  tags:
    - kubernetes
    - k8s_pv_nfs
# Play: on the compute group, include the k8s_nfs_client_setup role unless
# the powervault_status variable recorded for host 127.0.0.1 is truthy.
# NOTE(review): indentation was lost in this copy of the file; `tags` is
# placed at play level, as in the other plays - confirm against the original.
- name: Apply NFS client setup on compute nodes
  hosts: compute
  gather_facts: false
  tasks:
    - name: Apply NFS client setup on compute nodes
      include_role:
        name: k8s_nfs_client_setup
      when: not hostvars['127.0.0.1']['powervault_status']
  tags:
    - kubernetes
    - k8s_pv_nfs
# Play: run the k8s_start_manager role on the manager group, gathering facts
# at the start of the play. Tagged "kubernetes".
- name: Start K8s on manager server
  hosts: manager
  gather_facts: true
  roles:
    - k8s_start_manager
  tags: kubernetes
# Play: run the k8s_start_workers role on the compute group.
# Tagged "kubernetes".
- name: Start K8s worker servers on compute nodes
  hosts: compute
  gather_facts: false
  roles:
    - k8s_start_workers
  tags: kubernetes
# Play: run the k8s_start_services role on the manager and compute groups.
# Tagged "kubernetes".
# The play name now reflects the role and host pattern used here; the
# previous name described worker servers on manager nodes.
- name: Start K8s services on manager and compute nodes
  hosts: manager, compute
  gather_facts: false
  roles:
    - k8s_start_services
  tags: kubernetes
# Play: run the slurm_common role on the manager, compute and login_node
# groups. Tagged "slurm".
- name: Apply common Slurm installation and config
  hosts: manager, compute, login_node
  gather_facts: false
  roles:
    - slurm_common
  tags: slurm
# Play: run the slurm_manager role on the manager group. Tagged "slurm".
- name: Apply Slurm manager config
  hosts: manager
  gather_facts: false
  roles:
    - slurm_manager
  tags: slurm
# Play: run the slurm_workers role on the compute and login_node groups.
# Tagged "slurm".
- name: Configure Slurm workers
  hosts: compute, login_node
  # Batch size of one: the play is completed on a host before the next starts.
  serial: 1
  gather_facts: false
  roles:
    - slurm_workers
  tags: slurm
# Play: run the slurm_workers_service role on the compute and login_node
# groups. Tagged "slurm".
- name: Start Slurm workers
  hosts: compute, login_node
  gather_facts: false
  roles:
    - slurm_workers_service
  tags: slurm
# Play: run the slurm_start_services role on the manager group.
# Tagged "slurm".
- name: Start Slurm services
  hosts: manager
  gather_facts: false
  roles:
    - slurm_start_services
  tags: slurm
# Play: run the slurm_exporter role on the manager group. Tagged "slurm".
- name: Install slurm exporter
  hosts: manager
  gather_facts: false
  roles:
    - slurm_exporter
  tags: slurm
# Play: run the slurm_restd role on the manager group. Tagged "slurm".
- name: Install slurm restd
  hosts: manager
  gather_facts: false
  roles:
    - slurm_restd
  tags: slurm
# Play: run the beegfs_client role on the manager and compute groups.
# Tagged "beegfs".
- name: Apply BeeGFS client installation and config on manager and compute nodes
  hosts: manager, compute
  gather_facts: false
  roles:
    - beegfs_client
  tags: beegfs
# Import the plays defined in control_plane/tools/passwordless_ssh.yml.
- name: Passwordless SSH between manager and compute nodes
  import_playbook: control_plane/tools/passwordless_ssh.yml