Watchmen GPU Scheduler

GPU Status

{# GPU status: when 'hostname' is in gpu_msg, print the host line, a column header, and one row per entry of gpu_msg.gpus; otherwise print gpu_msg itself. -#}
{% if 'hostname' in gpu_msg %}

{{ gpu_msg.hostname }} : {{ gpu_msg.query_time }}

Index Name Temp Util Memory #Process
{# The row must live inside the loop: a Jinja loop variable is not visible after endfor. -#}
{% for gpu in gpu_msg.gpus %}
{{ gpu.index }} {{ gpu.name }} {{ gpu['temperature.gpu'] }} {{ gpu['utilization.gpu'] }} {{ gpu['memory.used'] }} / {{ gpu['memory.total'] }} {{ gpu.processes|length }}
{% endfor %}
{% else %}

{{ gpu_msg }}

{% endif %}

Working Queue Status

{# Working queue: when work_msg.status is "ok", print a column header and one row per entry of work_msg.msg; otherwise print work_msg itself. -#}
{% if work_msg.status == "ok" %}
ID Mode GPU Scope Request GPU Num Queue Num Last Request Time Status
{# The row and its status label must live inside the loop: a Jinja loop variable is not visible after endfor. -#}
{% for client in work_msg.msg %}
{{ client.id }} {{ client.mode }} {{ client.gpus }} {{ client.req_gpu_num }} {{ client.queue_num }} {{ client.last_request_time }} {% if client.status == "ok" %}

OK

{% elif client.status == "waiting" %}

Waiting

{% elif client.status == "timeout" %}

Timeout

{% endif %}
{% endfor %}
{% else %}

{{ work_msg }}

{% endif %}

Finished Queue Status

{# Finished queue: when finished_msg.status is "ok", print a column header and one row per entry of finished_msg.msg; otherwise print finished_msg itself. -#}
{% if finished_msg.status == "ok" %}
ID Mode Request GPU Num GPU Scope Available GPUs Queue Num Last Request Time Status
{# The row and its status label must live inside the loop: a Jinja loop variable is not visible after endfor. -#}
{% for client in finished_msg.msg %}
{{ client.id }} {{ client.mode }} {{ client.req_gpu_num }} {{ client.gpus }} {{ client.available_gpus }} {{ client.queue_num }} {{ client.last_request_time }} {% if client.status == "ok" %}

OK

{% elif client.status == "waiting" %}

Waiting

{% elif client.status == "timeout" %}

Timeout

{% endif %}
{% endfor %}
{% else %}

{{ finished_msg }}

{% endif %}