# omnia.yml
#
# Copyright 2020 Dell Inc. or its subsidiaries. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
---
  # Runs the cluster_validation role on the control node itself
  # (localhost over a local connection); no facts are gathered.
  - name: Validate the cluster
    hosts: localhost
    connection: local
    # Canonical boolean; the other plays in this file use true/false.
    gather_facts: false
    roles:
      - cluster_validation
  # This play has no roles or tasks: it exists only so that fact gathering
  # runs against every inventory host. gather_facts is stated explicitly so
  # the play does not depend on the configured default gathering policy.
  - name: Gather facts from all the nodes
    hosts: all
    gather_facts: true
  # On the manager group: set ssh_to to the hosts of the compute group in a
  # pre_task, then run the cluster_preperation role.
  # NOTE(review): ssh_to is presumably consumed by the role - confirm there.
  - name: Prepare the cluster with passwordless ssh from manager to compute
    hosts: manager
    gather_facts: false
    pre_tasks:
      - name: Set Fact
        set_fact:
          ssh_to: "{{ groups['compute'] }}"
    roles:
      - cluster_preperation
  # On the compute group: set ssh_to to the hosts of the manager group in a
  # pre_task, then run the cluster_preperation role.
  # NOTE(review): ssh_to is presumably consumed by the role - confirm there.
  - name: Prepare the cluster with passwordless ssh from compute to manager
    hosts: compute
    gather_facts: false
    pre_tasks:
      - name: Set Fact
        set_fact:
          ssh_to: "{{ groups['manager'] }}"
    roles:
      - cluster_preperation
  # Runs the common role on the manager and compute groups; selectable
  # with the "common" tag.
  - name: Apply common installation and config
    hosts: manager, compute
    gather_facts: false
    tags: common
    roles:
      - common
  # Runs the k8s_common role on the manager and compute groups; selectable
  # with the "kubernetes" tag.
  - name: Apply common K8s installation and config
    hosts: manager, compute
    gather_facts: false
    tags: kubernetes
    roles:
      - k8s_common
  # Runs the compute_gpu role on the gpus group. This play carries no tag.
  - name: Apply GPU node config
    hosts: gpus
    gather_facts: false
    roles:
      - compute_gpu
  # Runs the k8s_manager role on the manager group; facts are gathered
  # for this play. Selectable with the "kubernetes" tag.
  - name: Apply K8s manager config
    hosts: manager
    gather_facts: true
    tags: kubernetes
    roles:
      - k8s_manager
  # Runs the k8s_firewalld role on the manager and compute groups;
  # selectable with the "kubernetes" tag.
  - name: Apply K8s firewalld config on manager and compute nodes
    hosts: manager, compute
    gather_facts: false
    tags: kubernetes
    roles:
      - k8s_firewalld
  # Runs the k8s_nfs_server_setup role on the manager group; selectable
  # with the "kubernetes" tag.
  - name: Apply NFS server setup on manager node
    hosts: manager
    gather_facts: false
    tags: kubernetes
    roles:
      - k8s_nfs_server_setup
  # Runs the k8s_nfs_client_setup role on the compute group; selectable
  # with the "kubernetes" tag.
  - name: Apply NFS client setup on compute nodes
    hosts: compute
    gather_facts: false
    tags: kubernetes
    roles:
      - k8s_nfs_client_setup
  # Runs the k8s_start_manager role on the manager group; facts are
  # gathered for this play. Selectable with the "kubernetes" tag.
  - name: Start K8s on manager server
    hosts: manager
    gather_facts: true
    tags: kubernetes
    roles:
      - k8s_start_manager
  # Runs the k8s_start_workers role on the compute group; selectable
  # with the "kubernetes" tag.
  - name: Start K8s worker servers on compute nodes
    hosts: compute
    gather_facts: false
    tags: kubernetes
    roles:
      - k8s_start_workers
  # Runs the k8s_start_services role on the manager group; selectable
  # with the "kubernetes" tag. The play name reflects the role it applies
  # (it previously repeated the "worker servers" wording of the worker play).
  - name: Start K8s services on manager nodes
    hosts: manager
    gather_facts: false
    tags: kubernetes
    roles:
      - k8s_start_services
  # Runs the slurm_common role on the manager and compute groups;
  # selectable with the "slurm" tag.
  - name: Apply common Slurm installation and config
    hosts: manager, compute
    gather_facts: false
    tags: slurm
    roles:
      - slurm_common
  # Runs the slurm_manager role on the manager group; selectable with
  # the "slurm" tag.
  - name: Apply Slurm manager config
    hosts: manager
    gather_facts: false
    tags: slurm
    roles:
      - slurm_manager
  # Runs the slurm_workers role on the compute group; selectable with
  # the "slurm" tag.
  - name: Start Slurm workers
    hosts: compute
    gather_facts: false
    tags: slurm
    roles:
      - slurm_workers
  # Runs the slurm_start_services role on the manager group; selectable
  # with the "slurm" tag.
  - name: Start Slurm services
    hosts: manager
    gather_facts: false
    tags: slurm
    roles:
      - slurm_start_services
  # Runs the slurm_exporter role on the manager group; selectable with
  # the "slurm" tag.
  - name: Install slurm exporter
    hosts: manager
    gather_facts: false
    tags: slurm
    roles:
      - slurm_exporter