From 68d4976a97b4f6c6375f37895e1425784c33eff9 Mon Sep 17 00:00:00 2001
From: IcyAltair
Date: Fri, 26 Dec 2025 18:05:36 +0300
Subject: [PATCH] fixed ansible playbooks

---
What this patch does:
  * more_check role: drops the four bm-smi based tasks (log delete, log
    save, device-memory grep, TPU grep) and replaces them with a single
    read-only nvidia-smi query that reports GPU utilization, used memory
    and total memory; the debug output gets one "gpu" field in place of
    "dev_mem" and "tpu".
  * run role: drops the weights-directory task and the long "docker run"
    task; the service is now started with "docker compose up -d" executed
    in the directory given by the "path" variable.
  * stop role: stops the service with "docker compose down" in the same
    directory instead of "docker stop faces_service_<port>".
  * docker-compose.yml: the build context becomes ./master-node.
  * master-node/docker-compose.yml: new compose file that builds from the
    master-node directory itself.

Review fixes folded into the hunks below:
  1. chdir values are written as "{{ path }}" (quoted). A YAML value that
     starts with an unquoted "{" is read as a flow mapping, so the task
     file would not load.
  2. changed_when in the run role is "run_info.rc == 0". The previous
     "!= 0" form could only be true for a command that had already failed
     the task, so a successful start was never reported as changed.
  3. docker-compose.yml: dockerfile is now "Dockerfile". Compose resolves
     it relative to the build context, so keeping ./master-node/Dockerfile
     under context ./master-node would point at
     master-node/master-node/Dockerfile.
  4. The run role uses ansible.builtin.command, like the stop role; the
     command line uses no shell features.

NOTE(review): the "path" variable is not defined anywhere in this patch;
confirm the play or inventory provides it.
NOTE(review): the "index" blob hashes below were carried over unchanged and
do not reflect fixes 1-4; regenerate the patch if a 3-way apply is needed.
NOTE(review): leading whitespace of context and removed lines was
reconstructed; check it against the target files before applying.

 ansible/roles/more_check/tasks/main.yml | 23 +++++-------------
 ansible/roles/run/tasks/main.yml        | 32 +++++--------------------
 ansible/roles/stop/tasks/main.yml       |  4 +++-
 docker-compose.yml                      |  4 ++--
 master-node/docker-compose.yml          |  8 +++++++
 5 files changed, 25 insertions(+), 46 deletions(-)
 create mode 100644 master-node/docker-compose.yml

diff --git a/ansible/roles/more_check/tasks/main.yml b/ansible/roles/more_check/tasks/main.yml
index 7aab7be..8ae22a1 100644
--- a/ansible/roles/more_check/tasks/main.yml
+++ b/ansible/roles/more_check/tasks/main.yml
@@ -6,21 +6,11 @@
   ansible.builtin.shell: free -m | awk 'NR==2{printf "%d", ($2-$3)}'
   register: sys_mem_info
 
-- name: Delete bm-smi log
-  ansible.builtin.shell: rm -f bm-smi.log
-  register: del_file
-
-- name: Save bm-smi log
-  ansible.builtin.shell: /opt/sophon/libsophon-0.4.8/bin/bm-smi -noloop --file=./bm-smi.log
-  register: save_file
-
-- name: Check used device memory
-  ansible.builtin.shell: cat bm-smi.log | grep -o '[0-9]\+MB/ ' | grep -o -E '[0-9]+'
-  register: dev_mem_info
-
-- name: Check used TPU
-  ansible.builtin.shell: cat bm-smi.log | grep -o '[0-9]\+%' | grep -o -E -m 1 '[0-9]+'
-  register: tpu_info
+- name: Check used GPU
+  ansible.builtin.shell: |
+    nvidia-smi --query-gpu=utilization.gpu,memory.used,memory.total --format=csv,noheader,nounits
+  register: gpu_info
+  changed_when: false
 
 - name: Check used CPU
   ansible.builtin.shell: sar 1 1 | grep "Average" | awk '{print 100-$8}'
@@ -35,7 +25,6 @@
     msg:
       running: "{{ running_info.stdout_lines }}"
       sys_mem: "{{ sys_mem_info.stdout_lines }}"
-      dev_mem: "{{ dev_mem_info.stdout_lines }}"
-      tpu: "{{ tpu_info.stdout }}"
+      gpu: "{{ gpu_info.stdout }}"
       cpu: "{{ cpu_info.stdout }}"
       containers_ids: "{{ containers_id.stdout_lines }}"
diff --git a/ansible/roles/run/tasks/main.yml b/ansible/roles/run/tasks/main.yml
index 018fd84..02d3c6f 100644
--- a/ansible/roles/run/tasks/main.yml
+++ b/ansible/roles/run/tasks/main.yml
@@ -1,29 +1,9 @@
-- name: Create model weights directory if it does not exist
-  ansible.builtin.file:
-    path: /data/weights/synapse-faces-weights
-    state: directory
-    mode: '0775'
-
-- name: Run module
-  ansible.builtin.shell: docker run \
-    -d \
-    --rm \
-    --privileged=true \
-    -v /opt/sophon:/opt/sophon \
-    -v /etc/profile.d:/etc/profile.d \
-    -v /etc/ld.so.conf.d:/etc/ld.so.conf.d \
-    -v /data/weights/synapse-faces-weights:/server/data/weights/int8 \
-    -e DETECTOR_SIZE={{ size }} \
-    -e TZ="Europe/Moscow" \
-    -e MINIO_ENDPOINT="{{ MINIO_ENDPOINT }}" \
-    -e MINIO_ACCESS_KEY="{{ MINIO_ACCESS_KEY }}" \
-    -e MINIO_SECRET_KEY="{{ MINIO_SECRET_KEY }}" \
-    -e MINIO_PUB_CERT="{{ MINIO_PUB_CERT }}" \
-    -p {{ port }}:9000 \
-    --workdir /server \
-    --name faces_service_{{ port }} {{ image }} /bin/bash docker/tpu/entry.sh
-
-  register: run_info
+- name: Run docker compose up
+  ansible.builtin.command:
+    cmd: docker compose up -d
+    chdir: "{{ path }}"
+  register: run_info
+  changed_when: run_info.rc == 0
 
 - name: Display run info
   ansible.builtin.debug:
diff --git a/ansible/roles/stop/tasks/main.yml b/ansible/roles/stop/tasks/main.yml
index 83e175f..4a3c6cf 100644
--- a/ansible/roles/stop/tasks/main.yml
+++ b/ansible/roles/stop/tasks/main.yml
@@ -1,5 +1,7 @@
 - name: Stop module
-  ansible.builtin.shell: docker stop faces_service_{{ module_port }}
+  ansible.builtin.command:
+    cmd: docker compose down
+    chdir: "{{ path }}"
   register: stop_info
 
 - name: Display stop info
diff --git a/docker-compose.yml b/docker-compose.yml
index df14c29..db1b979 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -2,7 +2,7 @@ version: '3.8'
 services:
   master-node:
     build:
-      context: .
-      dockerfile: ./master-node/Dockerfile
+      context: ./master-node
+      dockerfile: Dockerfile
     ports:
       - "5010:5010"
diff --git a/master-node/docker-compose.yml b/master-node/docker-compose.yml
new file mode 100644
index 0000000..ec5af2a
--- /dev/null
+++ b/master-node/docker-compose.yml
@@ -0,0 +1,8 @@
+version: '3.8'
+services:
+  master-node:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    ports:
+      - "5010:5010"