Skip to content
Snippets Groups Projects
Commit 86b32344 authored by Trung Nguyen
Browse files

Merge branch 'mellanox_slurm' into 'master'

Update mellanox and slurm roles

See merge request hpc-team/ansible_cluster_in_a_box!247
parents 28371b7e cc7c328d
No related branches found
No related tags found
1 merge request: !247 Update mellanox and slurm roles
...@@ -53,7 +53,7 @@ ...@@ -53,7 +53,7 @@
set_fact: set_fact:
install_now: true install_now: true
reboot_now: true reboot_now: true
when: driver_version is failed or not desired_driver_version.stdout in driver_version.stdout when: driver_version | failed or not desired_driver_version.stdout in driver_version.stdout
- name: debug - print out value of install_now - name: debug - print out value of install_now
debug: var=install_now debug: var=install_now
...@@ -65,7 +65,7 @@ ...@@ -65,7 +65,7 @@
when: install_now when: install_now
- name: install drivers - name: install drivers
shell: ./mlnxofedinstall -q --add-kernel-support --force shell: ./mlnxofedinstall -q --add-kernel-support --force --skip-repo
args: args:
#more changes #more changes
chdir: "/tmp/{{ MELLANOX_DRIVER_SRC }}" chdir: "/tmp/{{ MELLANOX_DRIVER_SRC }}"
...@@ -87,9 +87,9 @@ ...@@ -87,9 +87,9 @@
register: reload_service register: reload_service
- name: enable roce_mode setting - name: enable roce_mode setting
service: name=roce_mode state=started enabled=True service: name=roce_mode state=started enabled=yes
become: true become: true
ignore_errors: yes
# #
# A REBOOT IS NEEDED AFTER SUCCESSFUL INSTALL # A REBOOT IS NEEDED AFTER SUCCESSFUL INSTALL
# #
......
--- ---
#note. do not add '.tgz' to driver src. done in playbook #note. do not add '.tgz' to driver src. done in playbook
#MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-3.1-1.0.3-rhel7.1-x86_64-ext{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}" #MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-4.4-1.0.0.0-rhel7.4-x86_64{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}"
#MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-3.1-1.0.3-rhel7.2-x86_64-ext{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}" MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-4.5-1.0.1.0-rhel7.6-x86_64{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}"
#MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-3.4-1.0.0.0-rhel7.2-x86_64{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}"
# MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-4.2-1.2.0.0-rhel7.4-x86_64{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}"
MELLANOX_DRIVER_SRC: "{% if ansible_os_family == 'RedHat' %}MLNX_OFED_LINUX-4.4-1.0.0.0-rhel7.4-x86_64{% elif ansible_os_family == 'Debian' %}MLNX_OFED_LINUX-3.1-1.0.3-ubuntu14.04-x86_64{% endif %}"
--- ---
slurm_use_vpn: False slurm_use_vpn: False
slurmctlddebug: {level: 9, log: '/var/log/slurm/slurmctld.log'} slurmddebug: {level: 5, log: '/var/log/slurm/slurmd.log'}
slurmddebug: {level: 9, log: '/var/log/slurm/slurmd.log'} slurmctlddebug: {level: 5, log: '/mnt/slurm-logs/slurmctld.log'}
slurmschedlog: {level: 9, log: '/var/log/slurm/slurmsched.log'} slurmdbdlog: {level: 5, log: '/mnt/slurm-logs/slurmdbd.log'}
slurmdbdlog: {level: 9, log: '/var/log/slurm/slurmdbd.log'}
slurmfairshare: {def: false, val: 10000} slurmfairshare: {def: false, val: 10000}
slurmdatadir: "/var/spool/slurm" slurmdatadir: "/var/spool/slurm"
slurmselecttype: "select/linear" slurmselecttype: "select/linear"
......
--- ---
- name: make sure slurmctld and slurmdb log dir exists
file: dest=/mnt/slurm-logs state=directory owner=root group=root mode=755
sudo: true
- name: make sure slurm conf dir exists - name: make sure slurm conf dir exists
file: dest={{ slurm_dir }}/etc state=directory file: dest={{ slurm_dir }}/etc state=directory
sudo: true sudo: true
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment